Kraken-LoRA / kraken_model /config.json
DavidGF's picture
Update kraken_model/config.json
7e9bd37 verified
{
  "architectures": [
    "KrakenForCausalLM"
  ],
  "auto_map": {
    "AutoConfig": "configuration_kraken_lora.KrakenConfig",
    "AutoModel": "modeling_kraken_lora.KrakenForCausalLM",
    "AutoModelForCausalLM": "modeling_kraken_lora.KrakenForCausalLM"
  },
  "config_dict": {
    "class_indices": {
      "LABEL_0": 0,
      "LABEL_1": 1,
      "LABEL_2": 2,
      "LABEL_3": 3,
      "LABEL_4": 4
    },
    "lora_adapters": {
      "lora_expert1": "Llama-3-Smaug-8B-adapter",
      "lora_expert2": "Meta-Llama-3-8B-Instruct-function-calling-json-mode-adapter",
      "lora_expert3": "Llama-3-8B-Instruct-Coder-adapter",
      "lora_expert4": "llama-3-sqlcoder-8b-adapter",
      "lora_expert5": "Llama-3-SauerkrautLM-8b-Instruct-adapter"
    },
    "model_type": "kraken",
    "models": {
      "base": "meta-llama/Meta-Llama-3-8B-Instruct"
    },
    "quantization": {
      "base": null
    },
    "router": "../kraken_router",
    "tokenizers": {
      "lora_expert1": "Llama-3-Smaug-8B-adapter",
      "lora_expert2": "Meta-Llama-3-8B-Instruct-function-calling-json-mode-adapter",
      "lora_expert3": "Llama-3-8B-Instruct-Coder-adapter",
      "lora_expert4": "llama-3-sqlcoder-8b-adapter",
      "lora_expert5": "Llama-3-SauerkrautLM-8b-Instruct-adapter"
    }
  },
  "model_type": "kraken",
  "torch_dtype": "bfloat16",
  "transformers_version": "4.41.1"
}