Kraken-LoRA / kraken_model /config.json
DavidGF's picture
Upload folder using huggingface_hub
4898674 verified
raw
history blame
1.17 kB
{
"architectures": [
"KrakenForCausalLM"
],
"config_dict": {
"class_indices": {
"LABEL_0": 0,
"LABEL_1": 1,
"LABEL_2": 2,
"LABEL_3": 3,
"LABEL_4": 4
},
"lora_adapters": {
"lora_expert1": "Llama-3-Smaug-8B-adapter",
"lora_expert2": "Meta-Llama-3-8B-Instruct-function-calling-json-mode-adapter",
"lora_expert3": "Llama-3-8B-Instruct-Coder-adapter",
"lora_expert4": "llama-3-sqlcoder-8b-adapter",
"lora_expert5": "Llama-3-SauerkrautLM-8b-Instruct-adapter"
},
"model_type": "kraken",
"models": {
"base": "meta-llama/Meta-Llama-3-8B-Instruct"
},
"quantization": {
"base": null
},
"router": "../kraken/kraken_router",
"tokenizers": {
"lora_expert1": "Llama-3-Smaug-8B-adapter",
"lora_expert2": "Meta-Llama-3-8B-Instruct-function-calling-json-mode-adapter",
"lora_expert3": "Llama-3-8B-Instruct-Coder-adapter",
"lora_expert4": "llama-3-sqlcoder-8b-adapter",
"lora_expert5": "Llama-3-SauerkrautLM-8b-Instruct-adapter"
}
},
"model_type": "kraken",
"torch_dtype": "bfloat16",
"transformers_version": "4.41.1"
}