tllama-0.13.0-hackcapecod / briton_config.pbtxt
pankajroark's picture
Upload folder using huggingface_hub
abfd696 verified
# Serving configuration in protobuf text format.
# NOTE(review): the message schema is not part of this file; the per-field
# notes below are inferred from field names only -- confirm against the schema.

# Engine and tokenizer locations. "data" is a relative path; what it is
# resolved against is not visible here.
engine_path: "data"
hf_tokenizer: "TinyLlama/TinyLlama-1.1B-Chat-v1.0"

# KV-cache / context settings (presumably forwarded to the inference runtime
# -- TODO confirm).
kv_cache_free_gpu_mem_fraction: 0.9
enable_kv_cache_reuse: true
enable_chunked_context: false

# Server port and on-disk cache directory.
port: 50051
fsm_cache_dir: "/cache/model/fsm_cache"

max_num_tokens: 8192

# Three token entries, each flagged special with every other flag disabled.
# Boolean literals are written lowercase to match enable_kv_cache_reuse above.
added_tokens {
  tokens {
    content: "<unk>"
    single_word: false
    lstrip: false
    rstrip: false
    normalized: false
    special: true
  }
  tokens {
    content: "<s>"
    single_word: false
    lstrip: false
    rstrip: false
    normalized: false
    special: true
  }
  tokens {
    content: "</s>"
    single_word: false
    lstrip: false
    rstrip: false
    normalized: false
    special: true
  }
}