philschmid HF staff committed on
Commit
0694451
1 Parent(s): ed667f7

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. engines/config.json +2 -2
  2. engines/rank0.engine +2 -2
engines/config.json CHANGED
@@ -63,9 +63,9 @@
63
  "max_input_len": 8000,
64
  "max_seq_len": 8192,
65
  "opt_batch_size": 8,
66
- "max_batch_size": 32,
67
  "max_beam_width": 1,
68
- "max_num_tokens": 262144,
69
  "opt_num_tokens": null,
70
  "max_prompt_embedding_table_size": 0,
71
  "kv_cache_type": "PAGED",
 
63
  "max_input_len": 8000,
64
  "max_seq_len": 8192,
65
  "opt_batch_size": 8,
66
+ "max_batch_size": 8,
67
  "max_beam_width": 1,
68
+ "max_num_tokens": 65536,
69
  "opt_num_tokens": null,
70
  "max_prompt_embedding_table_size": 0,
71
  "kv_cache_type": "PAGED",
engines/rank0.engine CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9237017b5eba0f364725a5d1d67fd215793151dd4720acdd9e33dfd73aca9b1e
3
- size 16155886596
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7df1fe24805ba9c3f1f650025f616f9df0e9455181784e81aab11de59aceed1c
3
+ size 16155880388