Geaming committed on
Commit
2359650
1 Parent(s): 3aab1f1

Update config.json to align with tokenizer_config.json and other Qwen2.5 models

Browse files

![348c672dd5410f43b1126f729f6e8498.png](https://cdn-uploads.huggingface.co/production/uploads/6355eaf660c1b72f6269bc64/guVsibyawodWMO6Mdia-S.png)

Files changed (1) hide show
  1. config.json +2 -2
config.json CHANGED
@@ -9,7 +9,7 @@
9
  "hidden_size": 2048,
10
  "initializer_range": 0.02,
11
  "intermediate_size": 11008,
12
- "max_position_embeddings": 32768,
13
  "max_window_layers": 36,
14
  "model_type": "qwen2",
15
  "num_attention_heads": 16,
@@ -17,7 +17,7 @@
17
  "num_key_value_heads": 2,
18
  "rms_norm_eps": 1e-06,
19
  "rope_theta": 1000000.0,
20
- "sliding_window": 32768,
21
  "tie_word_embeddings": true,
22
  "torch_dtype": "bfloat16",
23
  "transformers_version": "4.40.1",
 
9
  "hidden_size": 2048,
10
  "initializer_range": 0.02,
11
  "intermediate_size": 11008,
12
+ "max_position_embeddings": 131072,
13
  "max_window_layers": 36,
14
  "model_type": "qwen2",
15
  "num_attention_heads": 16,
 
17
  "num_key_value_heads": 2,
18
  "rms_norm_eps": 1e-06,
19
  "rope_theta": 1000000.0,
20
+ "sliding_window": 131072,
21
  "tie_word_embeddings": true,
22
  "torch_dtype": "bfloat16",
23
  "transformers_version": "4.40.1",