microsoft-phi-1_5 / neurocache_config.json
Ali Safaya
upgrade neurocache weights
c396b6b
raw
history blame contribute delete
490 Bytes
{
"attention_layers": [
18,
19,
20,
21,
22,
23
],
"auto_mapping": null,
"base_model_name_or_path": "microsoft/phi-1_5",
"cache_dtype": "float16",
"cache_size": 262144,
"cache_type": "FIFO",
"compression_factor": 8,
"context_size": 2,
"global_cache": true,
"inference_mode": true,
"neighborhood_size": 2,
"neurocache_type": "ONDEVICE",
"retrieval_map": {
"18": 18
},
"similarity_fn": "l2",
"task_type": "CAUSAL_LM",
"topk": 8
}