{ "architectures": [ "KrakenForCausalLM" ], "auto_map": { "AutoConfig": "configuration_kraken_lora.KrakenConfig", "AutoModel": "modeling_kraken_lora.KrakenForCausalLM", "AutoModelForCausalLM": "modeling_kraken_lora.KrakenForCausalLM" }, "config_dict": { "class_indices": { "LABEL_0": 0, "LABEL_1": 1, "LABEL_2": 2, "LABEL_3": 3, "LABEL_4": 4 }, "lora_adapters": { "lora_expert1": "Llama-3-Smaug-8B-adapter", "lora_expert2": "Meta-Llama-3-8B-Instruct-function-calling-json-mode-adapter", "lora_expert3": "Llama-3-8B-Instruct-Coder-adapter", "lora_expert4": "llama-3-sqlcoder-8b-adapter", "lora_expert5": "Llama-3-SauerkrautLM-8b-Instruct-adapter" }, "model_type": "kraken", "models": { "base": "meta-llama/Meta-Llama-3-8B-Instruct" }, "quantization": { "base": null }, "router": "../kraken_router", "tokenizers": { "lora_expert1": "Llama-3-Smaug-8B-adapter", "lora_expert2": "Meta-Llama-3-8B-Instruct-function-calling-json-mode-adapter", "lora_expert3": "Llama-3-8B-Instruct-Coder-adapter", "lora_expert4": "llama-3-sqlcoder-8b-adapter", "lora_expert5": "Llama-3-SauerkrautLM-8b-Instruct-adapter" } }, "model_type": "kraken", "torch_dtype": "bfloat16", "transformers_version": "4.41.1" }