Update inference-cache-config/Llama3.1-70b.json
Browse files
inference-cache-config/Llama3.1-70b.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"meta-llama/Llama-3.1-70B": [
|
3 |
{
|
4 |
"batch_size": 1,
|
5 |
"sequence_length": 4096,
|
|
|
1 |
{
|
2 |
+
"meta-llama/Llama-3.1-70B-Instruct": [
|
3 |
{
|
4 |
"batch_size": 1,
|
5 |
"sequence_length": 4096,
|