Set use_cache to true; otherwise inference performance is poor
config.json CHANGED (+1 −1)

@@ -19,6 +19,6 @@
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.30.0.dev0",
-  "use_cache": false,
+  "use_cache": true,
   "vocab_size": 32000
 }
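For context, use_cache controls whether the model reuses the key/value states of already-decoded tokens during autoregressive generation instead of recomputing them at every step, which is what makes generation fast. A minimal sketch of how the flag plays out at generation time, assuming a standard transformers causal LM checkpoint (the model id below is a placeholder, not the actual repository name):

    from transformers import AutoModelForCausalLM, AutoTokenizer

    # Placeholder id; substitute the actual checkpoint this commit belongs to.
    model_id = "your-org/your-model"

    tokenizer = AutoTokenizer.from_pretrained(model_id)
    # use_cache can also be overridden at load time, without editing config.json.
    model = AutoModelForCausalLM.from_pretrained(model_id, use_cache=True)

    inputs = tokenizer("Hello, world", return_tensors="pt")
    # With use_cache=True, past key/value states are reused at each decoding
    # step rather than recomputed from scratch.
    outputs = model.generate(**inputs, max_new_tokens=32)
    print(tokenizer.decode(outputs[0], skip_special_tokens=True))

The flag can also be flipped per call (e.g. model.generate(..., use_cache=False)), so fixing it in config.json mainly sets a sensible default for downstream users.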