dacorvo HF staff committed on
Commit
0548cd2
·
verified ·
1 Parent(s): 219c5fd

Update inference-cache-config/llama.json

Browse files
Files changed (1) hide show
  1. inference-cache-config/llama.json +8 -0
inference-cache-config/llama.json CHANGED
@@ -59,4 +59,12 @@
59
  "auto_cast_type": "bf16"
60
  }
61
  ],
 
 
 
 
 
 
 
 
62
  }
 
59
  "auto_cast_type": "bf16"
60
  }
61
  ],
62
+ "meta-llama/Meta-Llama-3-8B": [
63
+ {
64
+ "batch_size": 1,
65
+ "sequence_length": 4096,
66
+ "num_cores": 2,
67
+ "auto_cast_type": "bf16"
68
+ }
69
+ ]
70
  }