Ali Safaya committed on
Commit
7b89eff
·
1 Parent(s): a336651

initial commit

Browse files
Files changed (2) hide show
  1. neurocache_config.json +27 -0
  2. neurocache_model.bin +3 -0
neurocache_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "attention_layers": [
3
+ 18,
4
+ 19,
5
+ 20,
6
+ 21,
7
+ 22,
8
+ 23
9
+ ],
10
+ "auto_mapping": null,
11
+ "base_model_name_or_path": "microsoft/phi-1_5",
12
+ "cache_dtype": "bfloat16",
13
+ "cache_size": 16384,
14
+ "cache_type": "FIFO",
15
+ "compression_factor": 4,
16
+ "context_size": 2,
17
+ "global_cache": false,
18
+ "inference_mode": true,
19
+ "neighborhood_size": 2,
20
+ "neurocache_type": "ONDEVICE",
21
+ "retrieval_map": {
22
+ "18": 18
23
+ },
24
+ "similarity_fn": "l2",
25
+ "task_type": "CAUSAL_LM",
26
+ "topk": 16
27
+ }
neurocache_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c78724bf9a66ff01d7cf011b3054533103f6d65886e76bda7d329bbf3ffeaa2b
3
+ size 271603948