{
  "attention_layers": [
    18,
    19,
    20,
    21,
    22,
    23
  ],
  "auto_mapping": null,
  "base_model_name_or_path": "microsoft/phi-1_5",
  "cache_dtype": "float16",
  "cache_size": 262144,
  "cache_type": "FIFO",
  "compression_factor": 8,
  "context_size": 2,
  "global_cache": true,
  "inference_mode": true,
  "neighborhood_size": 2,
  "neurocache_type": "ONDEVICE",
  "retrieval_map": {
    "18": 18
  },
  "similarity_fn": "l2",
  "task_type": "CAUSAL_LM",
  "topk": 8
}