diff --git a/logs.txt b/logs.txt new file mode 100644 index 0000000000000000000000000000000000000000..bfd4be7f235c4dba741f00355bdbb1a8faf5a10d --- /dev/null +++ b/logs.txt @@ -0,0 +1,935 @@ +/home/cfruan/.conda/envs/mlc-source-311/bin/python -m mlc_llm gen_config /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct --quantization q3f16_1 --conv-template llama-3 --output /tmp/tmpbtropg_f --context-window-size 8192 --prefill-chunk-size 1024 +[2024-04-18 17:22:11] INFO auto_config.py:115: [92mFound[0m model configuration: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/config.json +[2024-04-18 17:22:11] INFO auto_config.py:153: [92mFound[0m model type: [1mllama[0m. Use `--model-type` to override. +[2024-04-18 17:22:11] INFO llama_model.py:52: [1mcontext_window_size[0m not found in config.json. Falling back to [1mmax_position_embeddings[0m (8192) +[2024-04-18 17:22:11] INFO llama_model.py:72: [1mprefill_chunk_size[0m defaults to [1mcontext_window_size[0m (8192) +[2024-04-18 17:22:11] INFO config.py:106: Overriding [1mcontext_window_size[0m from 8192 to 8192 +[2024-04-18 17:22:11] INFO config.py:106: Overriding [1mprefill_chunk_size[0m from 8192 to 1024 +[2024-04-18 17:22:11] INFO config.py:106: Overriding [1mmax_batch_size[0m from 1 to 80 +[2024-04-18 17:22:11] INFO gen_config.py:187: [generation_config.json] Setting [1mbos_token_id[0m: 128000 +[2024-04-18 17:22:11] INFO gen_config.py:187: [generation_config.json] Setting [1meos_token_id[0m: 128001 +[2024-04-18 17:22:11] INFO gen_config.py:201: [91mNot found[0m tokenizer config: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/tokenizer.model +[2024-04-18 17:22:11] INFO gen_config.py:199: [92mFound[0m tokenizer config: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/tokenizer.json. Copying to [1m/tmp/tmpbtropg_f/tokenizer.json[0m +[2024-04-18 17:22:11] INFO gen_config.py:201: [91mNot found[0m tokenizer config: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/vocab.json +[2024-04-18 17:22:11] INFO gen_config.py:201: [91mNot found[0m tokenizer config: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/merges.txt +[2024-04-18 17:22:11] INFO gen_config.py:201: [91mNot found[0m tokenizer config: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/added_tokens.json +[2024-04-18 17:22:11] INFO gen_config.py:199: [92mFound[0m tokenizer config: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/tokenizer_config.json. Copying to [1m/tmp/tmpbtropg_f/tokenizer_config.json[0m +[2024-04-18 17:22:11] INFO gen_config.py:76: [System default] Setting [1mpad_token_id[0m: 0 +[2024-04-18 17:22:11] INFO gen_config.py:76: [System default] Setting [1mtemperature[0m: 0.7 +[2024-04-18 17:22:11] INFO gen_config.py:76: [System default] Setting [1mpresence_penalty[0m: 0.0 +[2024-04-18 17:22:11] INFO gen_config.py:76: [System default] Setting [1mfrequency_penalty[0m: 0.0 +[2024-04-18 17:22:11] INFO gen_config.py:76: [System default] Setting [1mrepetition_penalty[0m: 1.0 +[2024-04-18 17:22:11] INFO gen_config.py:76: [System default] Setting [1mtop_p[0m: 0.95 +[2024-04-18 17:22:11] INFO gen_config.py:76: [System default] Setting [1mmean_gen_len[0m: 128 +[2024-04-18 17:22:11] INFO gen_config.py:76: [System default] Setting [1mmax_gen_len[0m: 512 +[2024-04-18 17:22:11] INFO gen_config.py:76: [System default] Setting [1mshift_fill_factor[0m: 0.3 +[2024-04-18 17:22:11] INFO gen_config.py:263: Dumping configuration file to: [1m/tmp/tmpbtropg_f/mlc-chat-config.json[0m +/home/cfruan/.conda/envs/mlc-source-311/bin/python -m mlc_llm convert_weight /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct --quantization q3f16_1 --source-format auto --output /tmp/tmpbtropg_f +[2024-04-18 17:22:13] INFO auto_config.py:115: [92mFound[0m model configuration: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/config.json +[2024-04-18 17:22:14] INFO auto_device.py:76: [92mFound[0m device: cuda:0 +[2024-04-18 17:22:14] INFO auto_device.py:76: [92mFound[0m device: cuda:1 +[2024-04-18 17:22:15] INFO auto_device.py:85: [91mNot found[0m device: rocm:0 +[2024-04-18 17:22:16] INFO auto_device.py:85: [91mNot found[0m device: metal:0 +[2024-04-18 17:22:17] INFO auto_device.py:76: [92mFound[0m device: vulkan:0 +[2024-04-18 17:22:17] INFO auto_device.py:76: [92mFound[0m device: vulkan:1 +[2024-04-18 17:22:17] INFO auto_device.py:76: [92mFound[0m device: vulkan:2 +[2024-04-18 17:22:19] INFO auto_device.py:85: [91mNot found[0m device: opencl:0 +[2024-04-18 17:22:19] INFO auto_device.py:33: Using device: [1mcuda:0[0m +[2024-04-18 17:22:19] INFO auto_weight.py:70: Finding weights in: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct +[2024-04-18 17:22:19] INFO auto_weight.py:136: [91mNot found[0m Huggingface PyTorch +[2024-04-18 17:22:19] INFO auto_weight.py:143: [92mFound[0m source weight format: huggingface-safetensor. Source configuration: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model.safetensors.index.json +[2024-04-18 17:22:19] INFO auto_weight.py:106: Using source weight configuration: [1m/ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model.safetensors.index.json[0m. Use `--source` to override. +[2024-04-18 17:22:19] INFO auto_weight.py:110: Using source weight format: [1mhuggingface-safetensor[0m. Use `--source-format` to override. +[2024-04-18 17:22:19] INFO auto_config.py:153: [92mFound[0m model type: [1mllama[0m. Use `--model-type` to override. +[2024-04-18 17:22:19] INFO llama_model.py:52: [1mcontext_window_size[0m not found in config.json. Falling back to [1mmax_position_embeddings[0m (8192) +[2024-04-18 17:22:19] INFO llama_model.py:72: [1mprefill_chunk_size[0m defaults to [1mcontext_window_size[0m (8192) +[1mWeight conversion with arguments:[0m + [1m--config[0m /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/config.json + [1m--quantization[0m GroupQuantize(name='q3f16_1', kind='group-quant', group_size=40, quantize_dtype='int3', storage_dtype='uint32', model_dtype='float16', linear_weight_layout='NK', quantize_embedding=True, quantize_final_fc=True, num_elem_per_storage=10, num_storage_per_group=4, max_int_value=3) + [1m--model-type[0m llama + [1m--device[0m cuda:0 + [1m--source[0m /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model.safetensors.index.json + [1m--source-format[0m huggingface-safetensor + [1m--output[0m /tmp/tmpbtropg_f +Start storing to cache /tmp/tmpbtropg_f + 0%| | 0/483 [00:00, ?it/s] [2024-04-18 17:22:39] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00030-of-00030.safetensors + 0%| | 0/483 [00:00, ?it/s] [2024-04-18 17:22:56] INFO group_quantization.py:217: Compiling quantize function for key: ((128256, 8192), float16, cuda, axis=1, output_transpose=False) + 0%| | 0/483 [00:16, ?it/s] [2024-04-18 17:22:57] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mlm_head.q_weight[0m", shape: (128256, 820), dtype: uint32 + 0%| | 0/483 [00:17, ?it/s] [2024-04-18 17:22:58] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mlm_head.q_scale[0m", shape: (128256, 205), dtype: float16 + 0%| | 0/483 [00:18, ?it/s] 0%|▎ | 1/483 [00:19<2:33:13, 19.07s/it] [2024-04-18 17:22:58] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00030-of-00030.safetensors + 0%|▎ | 1/483 [00:19<2:33:13, 19.07s/it] [2024-04-18 17:22:58] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00001-of-00030.safetensors + 0%|▎ | 1/483 [00:19<2:33:13, 19.07s/it] [2024-04-18 17:23:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.embed_tokens.q_weight[0m", shape: (128256, 820), dtype: uint32 + 0%|▎ | 1/483 [00:33<2:33:13, 19.07s/it] [2024-04-18 17:23:15] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.embed_tokens.q_scale[0m", shape: (128256, 205), dtype: float16 + 0%|▎ | 1/483 [00:35<2:33:13, 19.07s/it] 0%|▌ | 2/483 [00:35<2:22:32, 17.78s/it] [2024-04-18 17:23:15] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.0.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 0%|▌ | 2/483 [00:35<2:22:32, 17.78s/it] [2024-04-18 17:23:16] INFO group_quantization.py:217: Compiling quantize function for key: ((8192, 28672), float16, cuda, axis=1, output_transpose=False) + 0%|▌ | 2/483 [00:37<2:22:32, 17.78s/it] [2024-04-18 17:23:17] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.0.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 0%|▌ | 2/483 [00:37<2:22:32, 17.78s/it] [2024-04-18 17:23:17] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.0.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 0%|▌ | 2/483 [00:37<2:22:32, 17.78s/it] 1%|█▏ | 4/483 [00:37<57:40, 7.22s/it] [2024-04-18 17:23:21] INFO group_quantization.py:217: Compiling quantize function for key: ((57344, 8192), float16, cuda, axis=1, output_transpose=False) + 1%|█▏ | 4/483 [00:42<57:40, 7.22s/it] [2024-04-18 17:23:22] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.0.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 1%|█▏ | 4/483 [00:42<57:40, 7.22s/it] [2024-04-18 17:23:22] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.0.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 1%|█▏ | 4/483 [00:42<57:40, 7.22s/it] 1%|█▌ | 5/483 [00:43<52:33, 6.60s/it] [2024-04-18 17:23:22] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.0.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 1%|█▌ | 5/483 [00:43<52:33, 6.60s/it] [2024-04-18 17:23:23] INFO group_quantization.py:217: Compiling quantize function for key: ((10240, 8192), float16, cuda, axis=1, output_transpose=False) + 1%|█▌ | 5/483 [00:43<52:33, 6.60s/it] [2024-04-18 17:23:23] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.0.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 1%|█▌ | 5/483 [00:44<52:33, 6.60s/it] [2024-04-18 17:23:23] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.0.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 1%|█▌ | 5/483 [00:44<52:33, 6.60s/it] 1%|██ | 7/483 [00:44<29:54, 3.77s/it] [2024-04-18 17:23:24] INFO group_quantization.py:217: Compiling quantize function for key: ((8192, 8192), float16, cuda, axis=1, output_transpose=False) + 1%|██ | 7/483 [00:44<29:54, 3.77s/it] [2024-04-18 17:23:24] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.0.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 1%|██ | 7/483 [00:44<29:54, 3.77s/it] [2024-04-18 17:23:24] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.0.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 1%|██ | 7/483 [00:44<29:54, 3.77s/it] 2%|██▍ | 8/483 [00:44<23:50, 3.01s/it] [2024-04-18 17:23:24] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00002-of-00030.safetensors + 2%|██▍ | 8/483 [00:44<23:50, 3.01s/it] [2024-04-18 17:23:37] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.1.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 2%|██▍ | 8/483 [00:57<23:50, 3.01s/it] [2024-04-18 17:23:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.1.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 2%|██▍ | 8/483 [00:58<23:50, 3.01s/it] 2%|██▋ | 9/483 [00:58<46:19, 5.86s/it] [2024-04-18 17:23:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.1.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 2%|██▋ | 9/483 [01:00<46:19, 5.86s/it] [2024-04-18 17:23:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.1.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 2%|██▋ | 9/483 [01:00<46:19, 5.86s/it] 2%|███ | 10/483 [01:00<36:30, 4.63s/it] [2024-04-18 17:23:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.1.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 2%|███ | 10/483 [01:00<36:30, 4.63s/it] [2024-04-18 17:23:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.1.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 2%|███ | 10/483 [01:00<36:30, 4.63s/it] 2%|███▎ | 11/483 [01:00<26:58, 3.43s/it] [2024-04-18 17:23:40] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.1.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 2%|███▎ | 11/483 [01:00<26:58, 3.43s/it] [2024-04-18 17:23:41] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.1.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 2%|███▎ | 11/483 [01:01<26:58, 3.43s/it] [2024-04-18 17:23:41] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.1.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 2%|███▎ | 11/483 [01:01<26:58, 3.43s/it] 3%|███▉ | 13/483 [01:01<17:25, 2.23s/it] [2024-04-18 17:23:41] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.1.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 3%|███▉ | 13/483 [01:01<17:25, 2.23s/it] [2024-04-18 17:23:41] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.2.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 3%|███▉ | 13/483 [01:01<17:25, 2.23s/it] [2024-04-18 17:23:42] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.2.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 3%|███▉ | 13/483 [01:03<17:25, 2.23s/it] [2024-04-18 17:23:43] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.2.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 3%|███▉ | 13/483 [01:03<17:25, 2.23s/it] 3%|████▊ | 16/483 [01:03<10:38, 1.37s/it] [2024-04-18 17:23:47] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.2.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 3%|████▊ | 16/483 [01:07<10:38, 1.37s/it] [2024-04-18 17:23:47] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.2.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 3%|████▊ | 16/483 [01:07<10:38, 1.37s/it] 4%|█████ | 17/483 [01:08<15:34, 2.01s/it] [2024-04-18 17:23:47] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.2.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 4%|█████ | 17/483 [01:08<15:34, 2.01s/it] [2024-04-18 17:23:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.2.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 4%|█████ | 17/483 [01:08<15:34, 2.01s/it] [2024-04-18 17:23:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.2.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 4%|█████ | 17/483 [01:08<15:34, 2.01s/it] 4%|█████▋ | 19/483 [01:08<11:14, 1.45s/it] [2024-04-18 17:23:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.2.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 4%|█████▋ | 19/483 [01:09<11:14, 1.45s/it] [2024-04-18 17:23:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.2.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 4%|█████▋ | 19/483 [01:09<11:14, 1.45s/it] 4%|██████ | 20/483 [01:09<09:30, 1.23s/it] [2024-04-18 17:23:49] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.3.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 4%|██████ | 20/483 [01:09<09:30, 1.23s/it] [2024-04-18 17:23:50] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.3.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 4%|██████ | 20/483 [01:10<09:30, 1.23s/it] [2024-04-18 17:23:50] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.3.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 4%|██████ | 20/483 [01:10<09:30, 1.23s/it] 5%|██████▌ | 22/483 [01:10<08:06, 1.05s/it] [2024-04-18 17:23:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.3.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 5%|██████▌ | 22/483 [01:14<08:06, 1.05s/it] [2024-04-18 17:23:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.3.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 5%|██████▌ | 22/483 [01:15<08:06, 1.05s/it] 5%|██████▉ | 23/483 [01:15<13:15, 1.73s/it] [2024-04-18 17:23:54] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.3.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 5%|██████▉ | 23/483 [01:15<13:15, 1.73s/it] [2024-04-18 17:23:55] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.3.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 5%|██████▉ | 23/483 [01:15<13:15, 1.73s/it] [2024-04-18 17:23:55] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.3.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 5%|██████▉ | 23/483 [01:15<13:15, 1.73s/it] 5%|███████▌ | 25/483 [01:15<09:26, 1.24s/it] [2024-04-18 17:23:55] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.3.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 5%|███████▌ | 25/483 [01:16<09:26, 1.24s/it] [2024-04-18 17:23:56] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.3.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 5%|███████▌ | 25/483 [01:16<09:26, 1.24s/it] 5%|███████▊ | 26/483 [01:16<07:59, 1.05s/it] [2024-04-18 17:23:56] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.4.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 5%|███████▊ | 26/483 [01:16<07:59, 1.05s/it] [2024-04-18 17:23:56] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.4.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 5%|███████▊ | 26/483 [01:16<07:59, 1.05s/it] 6%|████████ | 27/483 [01:16<07:22, 1.03it/s] [2024-04-18 17:23:57] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.4.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 6%|████████ | 27/483 [01:17<07:22, 1.03it/s] [2024-04-18 17:23:57] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.4.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 6%|████████ | 27/483 [01:17<07:22, 1.03it/s] 6%|████████▍ | 28/483 [01:17<06:12, 1.22it/s] [2024-04-18 17:23:57] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00002-of-00030.safetensors + 6%|████████▍ | 28/483 [01:17<06:12, 1.22it/s] [2024-04-18 17:23:57] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00001-of-00030.safetensors + 6%|████████▍ | 28/483 [01:17<06:12, 1.22it/s] [2024-04-18 17:23:57] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00005-of-00030.safetensors + 6%|████████▍ | 28/483 [01:18<06:12, 1.22it/s] [2024-04-18 17:24:06] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.10.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 6%|████████▍ | 28/483 [01:26<06:12, 1.22it/s] 6%|████████▋ | 29/483 [01:26<23:43, 3.13s/it] [2024-04-18 17:24:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.10.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 6%|████████▋ | 29/483 [01:30<23:43, 3.13s/it] [2024-04-18 17:24:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.10.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 6%|████████▋ | 29/483 [01:30<23:43, 3.13s/it] 6%|█████████ | 30/483 [01:30<25:14, 3.34s/it] [2024-04-18 17:24:16] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.10.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 6%|█████████ | 30/483 [01:36<25:14, 3.34s/it] [2024-04-18 17:24:17] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.10.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 6%|█████████ | 30/483 [01:37<25:14, 3.34s/it] 6%|█████████▎ | 31/483 [01:37<31:48, 4.22s/it] [2024-04-18 17:24:17] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.10.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 6%|█████████▎ | 31/483 [01:37<31:48, 4.22s/it] [2024-04-18 17:24:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.10.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 6%|█████████▎ | 31/483 [01:38<31:48, 4.22s/it] [2024-04-18 17:24:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.10.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 6%|█████████▎ | 31/483 [01:38<31:48, 4.22s/it] 7%|█████████▉ | 33/483 [01:38<19:46, 2.64s/it] [2024-04-18 17:24:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.10.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 7%|█████████▉ | 33/483 [01:38<19:46, 2.64s/it] [2024-04-18 17:24:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.10.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 7%|█████████▉ | 33/483 [01:39<19:46, 2.64s/it] 7%|██████████▏ | 34/483 [01:39<15:35, 2.08s/it] [2024-04-18 17:24:18] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.11.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 7%|██████████▏ | 34/483 [01:39<15:35, 2.08s/it] [2024-04-18 17:24:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.11.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 7%|██████████▏ | 34/483 [01:40<15:35, 2.08s/it] [2024-04-18 17:24:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.11.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 7%|██████████▏ | 34/483 [01:40<15:35, 2.08s/it] 7%|██████████▊ | 36/483 [01:40<11:24, 1.53s/it] [2024-04-18 17:24:25] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.11.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 7%|██████████▊ | 36/483 [01:45<11:24, 1.53s/it] [2024-04-18 17:24:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.11.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 7%|██████████▊ | 36/483 [01:46<11:24, 1.53s/it] 8%|███████████ | 37/483 [01:46<19:00, 2.56s/it] [2024-04-18 17:24:26] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.11.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 8%|███████████ | 37/483 [01:46<19:00, 2.56s/it] [2024-04-18 17:24:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.11.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 8%|███████████ | 37/483 [01:47<19:00, 2.56s/it] [2024-04-18 17:24:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.11.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 8%|███████████ | 37/483 [01:47<19:00, 2.56s/it] 8%|███████████▋ | 39/483 [01:47<13:17, 1.80s/it] [2024-04-18 17:24:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.11.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 8%|███████████▋ | 39/483 [01:48<13:17, 1.80s/it] [2024-04-18 17:24:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.11.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 8%|███████████▋ | 39/483 [01:48<13:17, 1.80s/it] 8%|████████████ | 40/483 [01:48<10:56, 1.48s/it] [2024-04-18 17:24:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.12.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 8%|████████████ | 40/483 [01:53<10:56, 1.48s/it] [2024-04-18 17:24:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.12.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 8%|████████████ | 40/483 [01:53<10:56, 1.48s/it] 8%|████████████▎ | 41/483 [01:53<18:09, 2.47s/it] [2024-04-18 17:24:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.12.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 8%|████████████▎ | 41/483 [01:54<18:09, 2.47s/it] [2024-04-18 17:24:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.12.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 8%|████████████▎ | 41/483 [01:54<18:09, 2.47s/it] 9%|████████████▌ | 42/483 [01:54<15:17, 2.08s/it] [2024-04-18 17:24:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.12.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 9%|████████████▌ | 42/483 [01:54<15:17, 2.08s/it] [2024-04-18 17:24:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.12.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 9%|████████████▌ | 42/483 [01:55<15:17, 2.08s/it] 9%|████████████▉ | 43/483 [01:55<11:58, 1.63s/it] [2024-04-18 17:24:34] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00005-of-00030.safetensors + 9%|████████████▉ | 43/483 [01:55<11:58, 1.63s/it] [2024-04-18 17:24:35] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00006-of-00030.safetensors + 9%|████████████▉ | 43/483 [01:55<11:58, 1.63s/it] [2024-04-18 17:24:44] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.12.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 9%|████████████▉ | 43/483 [02:04<11:58, 1.63s/it] 9%|█████████████▏ | 44/483 [02:04<27:56, 3.82s/it] [2024-04-18 17:24:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.12.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 9%|█████████████▏ | 44/483 [02:06<27:56, 3.82s/it] [2024-04-18 17:24:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.12.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 9%|█████████████▏ | 44/483 [02:06<27:56, 3.82s/it] 9%|█████████████▌ | 45/483 [02:06<23:32, 3.22s/it] [2024-04-18 17:24:46] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.12.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 9%|█████████████▌ | 45/483 [02:06<23:32, 3.22s/it] [2024-04-18 17:24:46] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.13.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 9%|█████████████▌ | 45/483 [02:06<23:32, 3.22s/it] [2024-04-18 17:24:47] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.13.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 9%|█████████████▌ | 45/483 [02:07<23:32, 3.22s/it] [2024-04-18 17:24:47] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.13.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 9%|█████████████▌ | 45/483 [02:07<23:32, 3.22s/it] 10%|██████████████▍ | 48/483 [02:08<12:43, 1.76s/it] [2024-04-18 17:24:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.13.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 10%|██████████████▍ | 48/483 [02:12<12:43, 1.76s/it] [2024-04-18 17:24:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.13.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 10%|██████████████▍ | 48/483 [02:13<12:43, 1.76s/it] 10%|██████████████▋ | 49/483 [02:13<18:12, 2.52s/it] [2024-04-18 17:24:53] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.13.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 10%|██████████████▋ | 49/483 [02:13<18:12, 2.52s/it] [2024-04-18 17:24:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.13.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 10%|██████████████▋ | 49/483 [02:14<18:12, 2.52s/it] [2024-04-18 17:24:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.13.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 10%|██████████████▋ | 49/483 [02:14<18:12, 2.52s/it] 11%|███████████████▎ | 51/483 [02:14<12:50, 1.78s/it] [2024-04-18 17:24:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.13.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 11%|███████████████▎ | 51/483 [02:14<12:50, 1.78s/it] [2024-04-18 17:24:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.13.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 11%|███████████████▎ | 51/483 [02:14<12:50, 1.78s/it] 11%|███████████████▌ | 52/483 [02:14<10:43, 1.49s/it] [2024-04-18 17:24:54] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.14.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 11%|███████████████▌ | 52/483 [02:14<10:43, 1.49s/it] [2024-04-18 17:24:55] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.14.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 11%|███████████████▌ | 52/483 [02:16<10:43, 1.49s/it] [2024-04-18 17:24:56] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.14.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 11%|███████████████▌ | 52/483 [02:16<10:43, 1.49s/it] 11%|████████████████▏ | 54/483 [02:16<08:35, 1.20s/it] [2024-04-18 17:25:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.14.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 11%|████████████████▏ | 54/483 [02:20<08:35, 1.20s/it] [2024-04-18 17:25:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.14.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 11%|████████████████▏ | 54/483 [02:20<08:35, 1.20s/it] 11%|████████████████▌ | 55/483 [02:20<13:34, 1.90s/it] [2024-04-18 17:25:00] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.14.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 11%|████████████████▌ | 55/483 [02:20<13:34, 1.90s/it] [2024-04-18 17:25:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.14.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 11%|████████████████▌ | 55/483 [02:21<13:34, 1.90s/it] [2024-04-18 17:25:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.14.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 11%|████████████████▌ | 55/483 [02:21<13:34, 1.90s/it] 12%|█████████████████ | 57/483 [02:21<09:16, 1.31s/it] [2024-04-18 17:25:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.14.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 12%|█████████████████ | 57/483 [02:21<09:16, 1.31s/it] [2024-04-18 17:25:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.14.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 12%|█████████████████ | 57/483 [02:21<09:16, 1.31s/it] 12%|█████████████████▍ | 58/483 [02:21<07:50, 1.11s/it] [2024-04-18 17:25:01] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00007-of-00030.safetensors + 12%|█████████████████▍ | 58/483 [02:21<07:50, 1.11s/it] [2024-04-18 17:25:16] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.15.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 12%|█████████████████▍ | 58/483 [02:36<07:50, 1.11s/it] [2024-04-18 17:25:17] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.15.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 12%|█████████████████▍ | 58/483 [02:38<07:50, 1.11s/it] 12%|█████████████████▋ | 59/483 [02:38<32:54, 4.66s/it] [2024-04-18 17:25:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.15.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 12%|█████████████████▋ | 59/483 [02:39<32:54, 4.66s/it] [2024-04-18 17:25:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.15.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 12%|█████████████████▋ | 59/483 [02:39<32:54, 4.66s/it] 12%|██████████████████ | 60/483 [02:39<26:27, 3.75s/it] [2024-04-18 17:25:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.15.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 12%|██████████████████ | 60/483 [02:39<26:27, 3.75s/it] [2024-04-18 17:25:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.15.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 12%|██████████████████ | 60/483 [02:39<26:27, 3.75s/it] 13%|██████████████████▎ | 61/483 [02:39<20:16, 2.88s/it] [2024-04-18 17:25:19] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.15.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 13%|██████████████████▎ | 61/483 [02:39<20:16, 2.88s/it] [2024-04-18 17:25:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.15.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 13%|██████████████████▎ | 61/483 [02:41<20:16, 2.88s/it] [2024-04-18 17:25:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.15.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 13%|██████████████████▎ | 61/483 [02:41<20:16, 2.88s/it] 13%|██████████████████▉ | 63/483 [02:42<15:01, 2.15s/it] [2024-04-18 17:25:21] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.15.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 13%|██████████████████▉ | 63/483 [02:42<15:01, 2.15s/it] [2024-04-18 17:25:21] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.16.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 13%|██████████████████▉ | 63/483 [02:42<15:01, 2.15s/it] [2024-04-18 17:25:23] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.16.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 13%|██████████████████▉ | 63/483 [02:43<15:01, 2.15s/it] [2024-04-18 17:25:23] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.16.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 13%|██████████████████▉ | 63/483 [02:43<15:01, 2.15s/it] 14%|███████████████████▊ | 66/483 [02:43<09:42, 1.40s/it] [2024-04-18 17:25:28] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.16.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 14%|███████████████████▊ | 66/483 [02:48<09:42, 1.40s/it] [2024-04-18 17:25:28] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.16.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 14%|███████████████████▊ | 66/483 [02:48<09:42, 1.40s/it] 14%|████████████████████ | 67/483 [02:48<14:23, 2.07s/it] [2024-04-18 17:25:28] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.16.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 14%|████████████████████ | 67/483 [02:48<14:23, 2.07s/it] [2024-04-18 17:25:29] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.16.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 14%|████████████████████ | 67/483 [02:49<14:23, 2.07s/it] [2024-04-18 17:25:29] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.16.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 14%|████████████████████ | 67/483 [02:49<14:23, 2.07s/it] 14%|████████████████████▋ | 69/483 [02:49<10:31, 1.53s/it] [2024-04-18 17:25:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.16.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 14%|████████████████████▋ | 69/483 [02:50<10:31, 1.53s/it] [2024-04-18 17:25:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.16.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 14%|████████████████████▋ | 69/483 [02:50<10:31, 1.53s/it] 14%|█████████████████████ | 70/483 [02:50<09:09, 1.33s/it] [2024-04-18 17:25:30] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.17.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 14%|█████████████████████ | 70/483 [02:50<09:09, 1.33s/it] [2024-04-18 17:25:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.17.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 14%|█████████████████████ | 70/483 [02:51<09:09, 1.33s/it] [2024-04-18 17:25:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.17.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 14%|█████████████████████ | 70/483 [02:52<09:09, 1.33s/it] 15%|█████████████████████▌ | 72/483 [02:52<08:03, 1.18s/it] [2024-04-18 17:25:37] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.17.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 15%|█████████████████████▌ | 72/483 [02:57<08:03, 1.18s/it] [2024-04-18 17:25:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.17.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 15%|█████████████████████▌ | 72/483 [02:58<08:03, 1.18s/it] 15%|█████████████████████▉ | 73/483 [02:58<15:05, 2.21s/it] [2024-04-18 17:25:38] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.17.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 15%|█████████████████████▉ | 73/483 [02:58<15:05, 2.21s/it] [2024-04-18 17:25:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.17.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 15%|█████████████████████▉ | 73/483 [02:59<15:05, 2.21s/it] [2024-04-18 17:25:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.17.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 15%|█████████████████████▉ | 73/483 [02:59<15:05, 2.21s/it] 16%|██████████████████████▌ | 75/483 [02:59<10:36, 1.56s/it] [2024-04-18 17:25:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.17.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 16%|██████████████████████▌ | 75/483 [02:59<10:36, 1.56s/it] [2024-04-18 17:25:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.17.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 16%|██████████████████████▌ | 75/483 [02:59<10:36, 1.56s/it] 16%|██████████████████████▊ | 76/483 [02:59<08:56, 1.32s/it] [2024-04-18 17:25:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.18.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 16%|██████████████████████▊ | 76/483 [03:00<08:56, 1.32s/it] [2024-04-18 17:25:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.18.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 16%|██████████████████████▊ | 76/483 [03:00<08:56, 1.32s/it] 16%|███████████████████████ | 77/483 [03:00<08:07, 1.20s/it] [2024-04-18 17:25:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.18.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 16%|███████████████████████ | 77/483 [03:00<08:07, 1.20s/it] [2024-04-18 17:25:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.18.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 16%|███████████████████████ | 77/483 [03:00<08:07, 1.20s/it] 16%|███████████████████████▍ | 78/483 [03:00<06:44, 1.00it/s] [2024-04-18 17:25:40] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00006-of-00030.safetensors + 16%|███████████████████████▍ | 78/483 [03:00<06:44, 1.00it/s] [2024-04-18 17:25:41] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00007-of-00030.safetensors + 16%|███████████████████████▍ | 78/483 [03:01<06:44, 1.00it/s] [2024-04-18 17:25:41] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00008-of-00030.safetensors + 16%|███████████████████████▍ | 78/483 [03:01<06:44, 1.00it/s] [2024-04-18 17:25:51] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.18.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 16%|███████████████████████▍ | 78/483 [03:11<06:44, 1.00it/s] 16%|███████████████████████▋ | 79/483 [03:11<24:01, 3.57s/it] [2024-04-18 17:25:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.18.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 16%|███████████████████████▋ | 79/483 [03:14<24:01, 3.57s/it] [2024-04-18 17:25:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.18.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 16%|███████████████████████▋ | 79/483 [03:14<24:01, 3.57s/it] 17%|████████████████████████ | 80/483 [03:14<22:47, 3.39s/it] [2024-04-18 17:25:59] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.18.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 17%|████████████████████████ | 80/483 [03:19<22:47, 3.39s/it] [2024-04-18 17:25:59] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.18.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 17%|████████████████████████ | 80/483 [03:20<22:47, 3.39s/it] 17%|████████████████████████▎ | 81/483 [03:20<26:49, 4.00s/it] [2024-04-18 17:26:00] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.18.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 17%|████████████████████████▎ | 81/483 [03:20<26:49, 4.00s/it] [2024-04-18 17:26:00] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.19.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 17%|████████████████████████▎ | 81/483 [03:20<26:49, 4.00s/it] [2024-04-18 17:26:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.19.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 17%|████████████████████████▎ | 81/483 [03:21<26:49, 4.00s/it] [2024-04-18 17:26:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.19.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 17%|████████████████████████▎ | 81/483 [03:21<26:49, 4.00s/it] 17%|█████████████████████████▏ | 84/483 [03:21<14:12, 2.14s/it] [2024-04-18 17:26:06] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.19.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 17%|█████████████████████████▏ | 84/483 [03:26<14:12, 2.14s/it] [2024-04-18 17:26:07] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.19.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 17%|█████████████████████████▏ | 84/483 [03:27<14:12, 2.14s/it] 18%|█████████████████████████▌ | 85/483 [03:27<18:54, 2.85s/it] [2024-04-18 17:26:07] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.19.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 18%|█████████████████████████▌ | 85/483 [03:27<18:54, 2.85s/it] [2024-04-18 17:26:08] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.19.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 18%|█████████████████████████▌ | 85/483 [03:28<18:54, 2.85s/it] [2024-04-18 17:26:08] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.19.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 18%|█████████████████████████▌ | 85/483 [03:28<18:54, 2.85s/it] 18%|██████████████████████████ | 87/483 [03:28<12:55, 1.96s/it] [2024-04-18 17:26:08] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.19.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 18%|██████████████████████████ | 87/483 [03:29<12:55, 1.96s/it] [2024-04-18 17:26:08] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.19.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 18%|██████████████████████████ | 87/483 [03:29<12:55, 1.96s/it] 18%|██████████████████████████▍ | 88/483 [03:29<11:12, 1.70s/it] [2024-04-18 17:26:08] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.20.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 18%|██████████████████████████▍ | 88/483 [03:29<11:12, 1.70s/it] [2024-04-18 17:26:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.20.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 18%|██████████████████████████▍ | 88/483 [03:30<11:12, 1.70s/it] [2024-04-18 17:26:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.20.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 18%|██████████████████████████▍ | 88/483 [03:31<11:12, 1.70s/it] 19%|███████████████████████████ | 90/483 [03:31<09:24, 1.44s/it] [2024-04-18 17:26:15] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.20.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 19%|███████████████████████████ | 90/483 [03:35<09:24, 1.44s/it] [2024-04-18 17:26:16] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.20.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 19%|███████████████████████████ | 90/483 [03:36<09:24, 1.44s/it] 19%|███████████████████████████▎ | 91/483 [03:36<14:53, 2.28s/it] [2024-04-18 17:26:16] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.20.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 19%|███████████████████████████▎ | 91/483 [03:36<14:53, 2.28s/it] [2024-04-18 17:26:17] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.20.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 19%|███████████████████████████▎ | 91/483 [03:37<14:53, 2.28s/it] [2024-04-18 17:26:17] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.20.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 19%|███████████████████████████▎ | 91/483 [03:37<14:53, 2.28s/it] 19%|███████████████████████████▉ | 93/483 [03:37<10:37, 1.63s/it] [2024-04-18 17:26:17] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.20.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 19%|███████████████████████████▉ | 93/483 [03:38<10:37, 1.63s/it] [2024-04-18 17:26:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.20.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 19%|███████████████████████████▉ | 93/483 [03:38<10:37, 1.63s/it] 19%|████████████████████████████▏ | 94/483 [03:38<08:59, 1.39s/it] [2024-04-18 17:26:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.21.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 19%|████████████████████████████▏ | 94/483 [03:38<08:59, 1.39s/it] [2024-04-18 17:26:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.21.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 19%|████████████████████████████▏ | 94/483 [03:39<08:59, 1.39s/it] 20%|████████████████████████████▌ | 95/483 [03:39<08:07, 1.26s/it] [2024-04-18 17:26:18] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00008-of-00030.safetensors + 20%|████████████████████████████▌ | 95/483 [03:39<08:07, 1.26s/it] [2024-04-18 17:26:19] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00009-of-00030.safetensors + 20%|████████████████████████████▌ | 95/483 [03:39<08:07, 1.26s/it] [2024-04-18 17:26:28] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.21.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 20%|████████████████████████████▌ | 95/483 [03:49<08:07, 1.26s/it] 20%|████████████████████████████▊ | 96/483 [03:49<22:19, 3.46s/it] [2024-04-18 17:26:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.21.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 20%|████████████████████████████▊ | 96/483 [03:50<22:19, 3.46s/it] [2024-04-18 17:26:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.21.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 20%|████████████████████████████▊ | 96/483 [03:51<22:19, 3.46s/it] 20%|█████████████████████████████ | 97/483 [03:51<19:58, 3.10s/it] [2024-04-18 17:26:35] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.21.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 20%|█████████████████████████████ | 97/483 [03:55<19:58, 3.10s/it] [2024-04-18 17:26:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.21.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 20%|█████████████████████████████ | 97/483 [03:56<19:58, 3.10s/it] 20%|█████████████████████████████▍ | 98/483 [03:56<23:46, 3.71s/it] [2024-04-18 17:26:36] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.21.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 20%|█████████████████████████████▍ | 98/483 [03:56<23:46, 3.71s/it] [2024-04-18 17:26:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.21.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 20%|█████████████████████████████▍ | 98/483 [03:56<23:46, 3.71s/it] [2024-04-18 17:26:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.21.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 20%|█████████████████████████████▍ | 98/483 [03:56<23:46, 3.71s/it] 21%|█████████████████████████████▊ | 100/483 [03:56<13:51, 2.17s/it] [2024-04-18 17:26:36] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.22.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 21%|█████████████████████████████▊ | 100/483 [03:56<13:51, 2.17s/it] [2024-04-18 17:26:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.22.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 21%|█████████████████████████████▊ | 100/483 [03:58<13:51, 2.17s/it] [2024-04-18 17:26:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.22.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 21%|█████████████████████████████▊ | 100/483 [03:58<13:51, 2.17s/it] 21%|██████████████████████████████▍ | 102/483 [03:58<10:48, 1.70s/it] [2024-04-18 17:26:43] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.22.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 21%|██████████████████████████████▍ | 102/483 [04:03<10:48, 1.70s/it] [2024-04-18 17:26:44] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.22.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 21%|██████████████████████████████▍ | 102/483 [04:04<10:48, 1.70s/it] 21%|██████████████████████████████▋ | 103/483 [04:04<15:58, 2.52s/it] [2024-04-18 17:26:44] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.22.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 21%|██████████████████████████████▋ | 103/483 [04:04<15:58, 2.52s/it] [2024-04-18 17:26:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.22.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 21%|██████████████████████████████▋ | 103/483 [04:05<15:58, 2.52s/it] [2024-04-18 17:26:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.22.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 21%|██████████████████████████████▋ | 103/483 [04:05<15:58, 2.52s/it] 22%|███████████████████████████████▎ | 105/483 [04:05<11:27, 1.82s/it] [2024-04-18 17:26:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.22.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 22%|███████████████████████████████▎ | 105/483 [04:06<11:27, 1.82s/it] [2024-04-18 17:26:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.22.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 22%|███████████████████████████████▎ | 105/483 [04:06<11:27, 1.82s/it] 22%|███████████████████████████████▌ | 106/483 [04:06<09:45, 1.55s/it] [2024-04-18 17:26:46] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.23.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 22%|███████████████████████████████▌ | 106/483 [04:06<09:45, 1.55s/it] [2024-04-18 17:26:47] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.23.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 22%|███████████████████████████████▌ | 106/483 [04:07<09:45, 1.55s/it] [2024-04-18 17:26:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.23.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 22%|███████████████████████████████▌ | 106/483 [04:08<09:45, 1.55s/it] 22%|████████████████████████████████▏ | 108/483 [04:08<08:21, 1.34s/it] [2024-04-18 17:26:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.23.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 22%|████████████████████████████████▏ | 108/483 [04:12<08:21, 1.34s/it] [2024-04-18 17:26:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.23.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 22%|████████████████████████████████▏ | 108/483 [04:13<08:21, 1.34s/it] 23%|████████████████████████████████▍ | 109/483 [04:13<13:44, 2.20s/it] [2024-04-18 17:26:53] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.23.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 23%|████████████████████████████████▍ | 109/483 [04:13<13:44, 2.20s/it] [2024-04-18 17:26:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.23.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 23%|████████████████████████████████▍ | 109/483 [04:14<13:44, 2.20s/it] [2024-04-18 17:26:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.23.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 23%|████████████████████████████████▍ | 109/483 [04:14<13:44, 2.20s/it] 23%|█████████████████████████████████ | 111/483 [04:14<09:32, 1.54s/it] [2024-04-18 17:26:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.23.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 23%|█████████████████████████████████ | 111/483 [04:14<09:32, 1.54s/it] [2024-04-18 17:26:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.23.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 23%|█████████████████████████████████ | 111/483 [04:15<09:32, 1.54s/it] 23%|█████████████████████████████████▍ | 112/483 [04:15<08:08, 1.32s/it] [2024-04-18 17:26:54] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00009-of-00030.safetensors + 23%|█████████████████████████████████▍ | 112/483 [04:15<08:08, 1.32s/it] [2024-04-18 17:26:55] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00010-of-00030.safetensors + 23%|█████████████████████████████████▍ | 112/483 [04:15<08:08, 1.32s/it] [2024-04-18 17:27:04] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.24.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 23%|█████████████████████████████████▍ | 112/483 [04:24<08:08, 1.32s/it] 23%|█████████████████████████████████▋ | 113/483 [04:24<20:30, 3.33s/it] [2024-04-18 17:27:06] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.24.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 23%|█████████████████████████████████▋ | 113/483 [04:26<20:30, 3.33s/it] [2024-04-18 17:27:06] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.24.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 23%|█████████████████████████████████▋ | 113/483 [04:26<20:30, 3.33s/it] 24%|█████████████████████████████████▉ | 114/483 [04:26<18:05, 2.94s/it] [2024-04-18 17:27:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.24.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 24%|█████████████████████████████████▉ | 114/483 [04:31<18:05, 2.94s/it] [2024-04-18 17:27:12] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.24.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 24%|█████████████████████████████████▉ | 114/483 [04:32<18:05, 2.94s/it] 24%|██████████████████████████████████▎ | 115/483 [04:32<22:41, 3.70s/it] [2024-04-18 17:27:12] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.24.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 24%|██████████████████████████████████▎ | 115/483 [04:32<22:41, 3.70s/it] [2024-04-18 17:27:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.24.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 24%|██████████████████████████████████▎ | 115/483 [04:33<22:41, 3.70s/it] [2024-04-18 17:27:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.24.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 24%|██████████████████████████████████▎ | 115/483 [04:33<22:41, 3.70s/it] 24%|██████████████████████████████████▉ | 117/483 [04:33<14:32, 2.38s/it] [2024-04-18 17:27:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.24.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 24%|██████████████████████████████████▉ | 117/483 [04:34<14:32, 2.38s/it] [2024-04-18 17:27:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.24.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 24%|██████████████████████████████████▉ | 117/483 [04:34<14:32, 2.38s/it] 24%|███████████████████████████████████▏ | 118/483 [04:34<11:38, 1.91s/it] [2024-04-18 17:27:14] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.25.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 24%|███████████████████████████████████▏ | 118/483 [04:34<11:38, 1.91s/it] [2024-04-18 17:27:15] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.25.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 24%|███████████████████████████████████▏ | 118/483 [04:35<11:38, 1.91s/it] [2024-04-18 17:27:15] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.25.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 24%|███████████████████████████████████▏ | 118/483 [04:35<11:38, 1.91s/it] 25%|███████████████████████████████████▊ | 120/483 [04:35<08:41, 1.44s/it] [2024-04-18 17:27:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.25.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 25%|███████████████████████████████████▊ | 120/483 [04:39<08:41, 1.44s/it] [2024-04-18 17:27:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.25.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 25%|███████████████████████████████████▊ | 120/483 [04:40<08:41, 1.44s/it] 25%|████████████████████████████████████ | 121/483 [04:40<13:40, 2.27s/it] [2024-04-18 17:27:20] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.25.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 25%|████████████████████████████████████ | 121/483 [04:40<13:40, 2.27s/it] [2024-04-18 17:27:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.25.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 25%|████████████████████████████████████ | 121/483 [04:41<13:40, 2.27s/it] [2024-04-18 17:27:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.25.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 25%|████████████████████████████████████ | 121/483 [04:41<13:40, 2.27s/it] 25%|████████████████████████████████████▋ | 123/483 [04:41<09:14, 1.54s/it] [2024-04-18 17:27:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.25.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 25%|████████████████████████████████████▋ | 123/483 [04:41<09:14, 1.54s/it] [2024-04-18 17:27:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.25.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 25%|████████████████████████████████████▋ | 123/483 [04:41<09:14, 1.54s/it] 26%|████████████████████████████████████▉ | 124/483 [04:42<07:42, 1.29s/it] [2024-04-18 17:27:25] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.26.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 26%|████████████████████████████████████▉ | 124/483 [04:46<07:42, 1.29s/it] [2024-04-18 17:27:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.26.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 26%|████████████████████████████████████▉ | 124/483 [04:46<07:42, 1.29s/it] 26%|█████████████████████████████████████▎ | 125/483 [04:46<12:47, 2.14s/it] [2024-04-18 17:27:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.26.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 26%|█████████████████████████████████████▎ | 125/483 [04:47<12:47, 2.14s/it] [2024-04-18 17:27:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.26.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 26%|█████████████████████████████████████▎ | 125/483 [04:47<12:47, 2.14s/it] 26%|█████████████████████████████████████▌ | 126/483 [04:47<10:46, 1.81s/it] [2024-04-18 17:27:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.26.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 26%|█████████████████████████████████████▌ | 126/483 [04:48<10:46, 1.81s/it] [2024-04-18 17:27:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.26.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 26%|█████████████████████████████████████▌ | 126/483 [04:48<10:46, 1.81s/it] 26%|█████████████████████████████████████▊ | 127/483 [04:48<08:37, 1.45s/it] [2024-04-18 17:27:28] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00010-of-00030.safetensors + 26%|█████████████████████████████████████▊ | 127/483 [04:48<08:37, 1.45s/it] [2024-04-18 17:27:28] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00011-of-00030.safetensors + 26%|█████████████████████████████████████▊ | 127/483 [04:48<08:37, 1.45s/it] [2024-04-18 17:27:38] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.26.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 26%|█████████████████████████████████████▊ | 127/483 [04:58<08:37, 1.45s/it] 27%|██████████████████████████████████████▏ | 128/483 [04:58<23:33, 3.98s/it] [2024-04-18 17:27:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.26.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 27%|██████████████████████████████████████▏ | 128/483 [05:00<23:33, 3.98s/it] [2024-04-18 17:27:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.26.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 27%|██████████████████████████████████████▏ | 128/483 [05:00<23:33, 3.98s/it] 27%|██████████████████████████████████████▍ | 129/483 [05:00<20:18, 3.44s/it] [2024-04-18 17:27:40] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.26.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 27%|██████████████████████████████████████▍ | 129/483 [05:00<20:18, 3.44s/it] [2024-04-18 17:27:40] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.27.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 27%|██████████████████████████████████████▍ | 129/483 [05:00<20:18, 3.44s/it] [2024-04-18 17:27:42] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.27.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 27%|██████████████████████████████████████▍ | 129/483 [05:02<20:18, 3.44s/it] [2024-04-18 17:27:42] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.27.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 27%|██████████████████████████████████████▍ | 129/483 [05:02<20:18, 3.44s/it] 27%|███████████████████████████████████████▎ | 132/483 [05:02<11:15, 1.92s/it] [2024-04-18 17:27:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.27.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 27%|███████████████████████████████████████▎ | 132/483 [05:07<11:15, 1.92s/it] [2024-04-18 17:27:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.27.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 27%|███████████████████████████████████████▎ | 132/483 [05:08<11:15, 1.92s/it] 28%|███████████████████████████████████████▋ | 133/483 [05:08<15:46, 2.70s/it] [2024-04-18 17:27:48] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.27.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 28%|███████████████████████████████████████▋ | 133/483 [05:08<15:46, 2.70s/it] [2024-04-18 17:27:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.27.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 28%|███████████████████████████████████████▋ | 133/483 [05:09<15:46, 2.70s/it] [2024-04-18 17:27:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.27.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 28%|███████████████████████████████████████▋ | 133/483 [05:09<15:46, 2.70s/it] 28%|████████████████████████████████████████▏ | 135/483 [05:09<10:48, 1.86s/it] [2024-04-18 17:27:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.27.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 28%|████████████████████████████████████████▏ | 135/483 [05:09<10:48, 1.86s/it] [2024-04-18 17:27:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.27.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 28%|████████████████████████████████████████▏ | 135/483 [05:09<10:48, 1.86s/it] 28%|████████████████████████████████████████▌ | 136/483 [05:09<09:02, 1.56s/it] [2024-04-18 17:27:49] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.28.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 28%|████████████████████████████████████████▌ | 136/483 [05:09<09:02, 1.56s/it] [2024-04-18 17:27:50] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.28.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 28%|████████████████████████████████████████▌ | 136/483 [05:11<09:02, 1.56s/it] [2024-04-18 17:27:51] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.28.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 28%|████████████████████████████████████████▌ | 136/483 [05:11<09:02, 1.56s/it] 29%|█████████████████████████████████████████▏ | 138/483 [05:11<07:14, 1.26s/it] [2024-04-18 17:27:55] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.28.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 29%|█████████████████████████████████████████▏ | 138/483 [05:15<07:14, 1.26s/it] [2024-04-18 17:27:56] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.28.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 29%|█████████████████████████████████████████▏ | 138/483 [05:16<07:14, 1.26s/it] 29%|█████████████████████████████████████████▍ | 139/483 [05:16<11:55, 2.08s/it] [2024-04-18 17:27:56] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.28.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 29%|█████████████████████████████████████████▍ | 139/483 [05:16<11:55, 2.08s/it] [2024-04-18 17:27:57] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.28.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 29%|█████████████████████████████████████████▍ | 139/483 [05:17<11:55, 2.08s/it] [2024-04-18 17:27:57] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.28.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 29%|█████████████████████████████████████████▍ | 139/483 [05:17<11:55, 2.08s/it] 29%|██████████████████████████████████████████ | 141/483 [05:17<08:10, 1.44s/it] [2024-04-18 17:27:57] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.28.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 29%|██████████████████████████████████████████ | 141/483 [05:17<08:10, 1.44s/it] [2024-04-18 17:27:57] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.28.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 29%|██████████████████████████████████████████ | 141/483 [05:17<08:10, 1.44s/it] 29%|██████████████████████████████████████████▎ | 142/483 [05:17<06:55, 1.22s/it] [2024-04-18 17:27:57] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00012-of-00030.safetensors + 29%|██████████████████████████████████████████▎ | 142/483 [05:17<06:55, 1.22s/it] [2024-04-18 17:28:11] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.29.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 29%|██████████████████████████████████████████▎ | 142/483 [05:32<06:55, 1.22s/it] [2024-04-18 17:28:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.29.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 29%|██████████████████████████████████████████▎ | 142/483 [05:33<06:55, 1.22s/it] 30%|██████████████████████████████████████████▋ | 143/483 [05:33<25:47, 4.55s/it] [2024-04-18 17:28:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.29.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 30%|██████████████████████████████████████████▋ | 143/483 [05:34<25:47, 4.55s/it] [2024-04-18 17:28:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.29.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 30%|██████████████████████████████████████████▋ | 143/483 [05:34<25:47, 4.55s/it] 30%|██████████████████████████████████████████▉ | 144/483 [05:34<21:03, 3.73s/it] [2024-04-18 17:28:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.29.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 30%|██████████████████████████████████████████▉ | 144/483 [05:34<21:03, 3.73s/it] [2024-04-18 17:28:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.29.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 30%|██████████████████████████████████████████▉ | 144/483 [05:35<21:03, 3.73s/it] 30%|███████████████████████████████████████████▏ | 145/483 [05:35<16:08, 2.87s/it] [2024-04-18 17:28:14] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.29.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 30%|███████████████████████████████████████████▏ | 145/483 [05:35<16:08, 2.87s/it] [2024-04-18 17:28:16] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.29.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 30%|███████████████████████████████████████████▏ | 145/483 [05:36<16:08, 2.87s/it] [2024-04-18 17:28:16] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.29.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 30%|███████████████████████████████████████████▏ | 145/483 [05:36<16:08, 2.87s/it] 30%|███████████████████████████████████████████▊ | 147/483 [05:36<11:27, 2.05s/it] [2024-04-18 17:28:16] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.29.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 30%|███████████████████████████████████████████▊ | 147/483 [05:36<11:27, 2.05s/it] [2024-04-18 17:28:16] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.30.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 30%|███████████████████████████████████████████▊ | 147/483 [05:36<11:27, 2.05s/it] [2024-04-18 17:28:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.30.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 30%|███████████████████████████████████████████▊ | 147/483 [05:38<11:27, 2.05s/it] [2024-04-18 17:28:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.30.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 30%|███████████████████████████████████████████▊ | 147/483 [05:38<11:27, 2.05s/it] 31%|████████████████████████████████████████████▋ | 150/483 [05:38<07:26, 1.34s/it] [2024-04-18 17:28:23] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.30.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 31%|████████████████████████████████████████████▋ | 150/483 [05:43<07:26, 1.34s/it] [2024-04-18 17:28:24] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.30.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 31%|████████████████████████████████████████████▋ | 150/483 [05:44<07:26, 1.34s/it] 31%|█████████████████████████████████████████████ | 151/483 [05:44<11:59, 2.17s/it] [2024-04-18 17:28:24] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.30.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 31%|█████████████████████████████████████████████ | 151/483 [05:44<11:59, 2.17s/it] [2024-04-18 17:28:25] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.30.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 31%|█████████████████████████████████████████████ | 151/483 [05:45<11:59, 2.17s/it] [2024-04-18 17:28:25] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.30.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 31%|█████████████████████████████████████████████ | 151/483 [05:45<11:59, 2.17s/it] 32%|█████████████████████████████████████████████▌ | 153/483 [05:45<08:41, 1.58s/it] [2024-04-18 17:28:25] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.30.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 32%|█████████████████████████████████████████████▌ | 153/483 [05:45<08:41, 1.58s/it] [2024-04-18 17:28:25] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.30.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 32%|█████████████████████████████████████████████▌ | 153/483 [05:45<08:41, 1.58s/it] 32%|█████████████████████████████████████████████▉ | 154/483 [05:45<07:25, 1.35s/it] [2024-04-18 17:28:25] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.31.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 32%|█████████████████████████████████████████████▉ | 154/483 [05:45<07:25, 1.35s/it] [2024-04-18 17:28:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.31.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 32%|█████████████████████████████████████████████▉ | 154/483 [05:47<07:25, 1.35s/it] [2024-04-18 17:28:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.31.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 32%|█████████████████████████████████████████████▉ | 154/483 [05:47<07:25, 1.35s/it] 32%|██████████████████████████████████████████████▌ | 156/483 [05:47<06:27, 1.19s/it] [2024-04-18 17:28:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.31.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 32%|██████████████████████████████████████████████▌ | 156/483 [05:51<06:27, 1.19s/it] [2024-04-18 17:28:32] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.31.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 32%|██████████████████████████████████████████████▌ | 156/483 [05:52<06:27, 1.19s/it] 33%|██████████████████████████████████████████████▊ | 157/483 [05:52<10:56, 2.02s/it] [2024-04-18 17:28:32] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.31.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 33%|██████████████████████████████████████████████▊ | 157/483 [05:52<10:56, 2.02s/it] [2024-04-18 17:28:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.31.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 33%|██████████████████████████████████████████████▊ | 157/483 [05:53<10:56, 2.02s/it] [2024-04-18 17:28:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.31.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 33%|██████████████████████████████████████████████▊ | 157/483 [05:53<10:56, 2.02s/it] 33%|███████████████████████████████████████████████▍ | 159/483 [05:53<07:45, 1.44s/it] [2024-04-18 17:28:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.31.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 33%|███████████████████████████████████████████████▍ | 159/483 [05:54<07:45, 1.44s/it] [2024-04-18 17:28:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.31.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 33%|███████████████████████████████████████████████▍ | 159/483 [05:54<07:45, 1.44s/it] 33%|███████████████████████████████████████████████▋ | 160/483 [05:54<06:35, 1.22s/it] [2024-04-18 17:28:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.32.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 33%|███████████████████████████████████████████████▋ | 160/483 [05:54<06:35, 1.22s/it] [2024-04-18 17:28:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.32.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 33%|███████████████████████████████████████████████▋ | 160/483 [05:54<06:35, 1.22s/it] 33%|████████████████████████████████████████████████ | 161/483 [05:54<06:01, 1.12s/it] [2024-04-18 17:28:35] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.32.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 33%|████████████████████████████████████████████████ | 161/483 [05:55<06:01, 1.12s/it] [2024-04-18 17:28:35] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.32.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 33%|████████████████████████████████████████████████ | 161/483 [05:55<06:01, 1.12s/it] 34%|████████████████████████████████████████████████▎ | 162/483 [05:55<05:04, 1.05it/s] [2024-04-18 17:28:35] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00011-of-00030.safetensors + 34%|████████████████████████████████████████████████▎ | 162/483 [05:55<05:04, 1.05it/s] [2024-04-18 17:28:35] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00012-of-00030.safetensors + 34%|████████████████████████████████████████████████▎ | 162/483 [05:55<05:04, 1.05it/s] [2024-04-18 17:28:36] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00013-of-00030.safetensors + 34%|████████████████████████████████████████████████▎ | 162/483 [05:56<05:04, 1.05it/s] [2024-04-18 17:28:45] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.32.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 34%|████████████████████████████████████████████████▎ | 162/483 [06:05<05:04, 1.05it/s] 34%|████████████████████████████████████████████████▌ | 163/483 [06:05<18:17, 3.43s/it] [2024-04-18 17:28:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.32.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 34%|████████████████████████████████████████████████▌ | 163/483 [06:08<18:17, 3.43s/it] [2024-04-18 17:28:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.32.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 34%|████████████████████████████████████████████████▌ | 163/483 [06:08<18:17, 3.43s/it] 34%|████████████████████████████████████████████████▉ | 164/483 [06:08<17:24, 3.27s/it] [2024-04-18 17:28:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.32.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 34%|████████████████████████████████████████████████▉ | 164/483 [06:13<17:24, 3.27s/it] [2024-04-18 17:28:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.32.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 34%|████████████████████████████████████████████████▉ | 164/483 [06:14<17:24, 3.27s/it] 34%|█████████████████████████████████████████████████▏ | 165/483 [06:14<21:24, 4.04s/it] [2024-04-18 17:28:54] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.32.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 34%|█████████████████████████████████████████████████▏ | 165/483 [06:14<21:24, 4.04s/it] [2024-04-18 17:28:54] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.33.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 34%|█████████████████████████████████████████████████▏ | 165/483 [06:14<21:24, 4.04s/it] [2024-04-18 17:28:55] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.33.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 34%|█████████████████████████████████████████████████▏ | 165/483 [06:15<21:24, 4.04s/it] [2024-04-18 17:28:55] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.33.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 34%|█████████████████████████████████████████████████▏ | 165/483 [06:16<21:24, 4.04s/it] 35%|██████████████████████████████████████████████████ | 168/483 [06:16<11:04, 2.11s/it] [2024-04-18 17:28:59] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.33.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 35%|██████████████████████████████████████████████████ | 168/483 [06:20<11:04, 2.11s/it] [2024-04-18 17:29:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.33.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 35%|██████████████████████████████████████████████████ | 168/483 [06:20<11:04, 2.11s/it] 35%|██████████████████████████████████████████████████▍ | 169/483 [06:20<13:45, 2.63s/it] [2024-04-18 17:29:00] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.33.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 35%|██████████████████████████████████████████████████▍ | 169/483 [06:20<13:45, 2.63s/it] [2024-04-18 17:29:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.33.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 35%|██████████████████████████████████████████████████▍ | 169/483 [06:21<13:45, 2.63s/it] [2024-04-18 17:29:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.33.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 35%|██████████████████████████████████████████████████▍ | 169/483 [06:21<13:45, 2.63s/it] 35%|██████████████████████████████████████████████████▉ | 171/483 [06:21<09:15, 1.78s/it] [2024-04-18 17:29:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.33.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 35%|██████████████████████████████████████████████████▉ | 171/483 [06:21<09:15, 1.78s/it] [2024-04-18 17:29:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.33.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 35%|██████████████████████████████████████████████████▉ | 171/483 [06:21<09:15, 1.78s/it] 36%|███████████████████████████████████████████████████▎ | 172/483 [06:21<07:39, 1.48s/it] [2024-04-18 17:29:01] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.34.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 36%|███████████████████████████████████████████████████▎ | 172/483 [06:21<07:39, 1.48s/it] [2024-04-18 17:29:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.34.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 36%|███████████████████████████████████████████████████▎ | 172/483 [06:22<07:39, 1.48s/it] [2024-04-18 17:29:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.34.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 36%|███████████████████████████████████████████████████▎ | 172/483 [06:23<07:39, 1.48s/it] 36%|███████████████████████████████████████████████████▉ | 174/483 [06:23<06:06, 1.19s/it] [2024-04-18 17:29:07] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.34.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 36%|███████████████████████████████████████████████████▉ | 174/483 [06:28<06:06, 1.19s/it] [2024-04-18 17:29:08] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.34.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 36%|███████████████████████████████████████████████████▉ | 174/483 [06:28<06:06, 1.19s/it] 36%|████████████████████████████████████████████████████▏ | 175/483 [06:28<10:55, 2.13s/it] [2024-04-18 17:29:08] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.34.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 36%|████████████████████████████████████████████████████▏ | 175/483 [06:28<10:55, 2.13s/it] [2024-04-18 17:29:09] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.34.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 36%|████████████████████████████████████████████████████▏ | 175/483 [06:29<10:55, 2.13s/it] [2024-04-18 17:29:09] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.34.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 36%|████████████████████████████████████████████████████▏ | 175/483 [06:29<10:55, 2.13s/it] 37%|████████████████████████████████████████████████████▊ | 177/483 [06:29<07:23, 1.45s/it] [2024-04-18 17:29:09] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.34.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 37%|████████████████████████████████████████████████████▊ | 177/483 [06:29<07:23, 1.45s/it] [2024-04-18 17:29:09] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.34.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 37%|████████████████████████████████████████████████████▊ | 177/483 [06:29<07:23, 1.45s/it] 37%|█████████████████████████████████████████████████████ | 178/483 [06:29<06:10, 1.21s/it] [2024-04-18 17:29:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.35.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 37%|█████████████████████████████████████████████████████ | 178/483 [06:30<06:10, 1.21s/it] [2024-04-18 17:29:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.35.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 37%|█████████████████████████████████████████████████████ | 178/483 [06:30<06:10, 1.21s/it] 37%|█████████████████████████████████████████████████████▎ | 179/483 [06:30<05:57, 1.18s/it] [2024-04-18 17:29:10] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00013-of-00030.safetensors + 37%|█████████████████████████████████████████████████████▎ | 179/483 [06:30<05:57, 1.18s/it] [2024-04-18 17:29:11] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00014-of-00030.safetensors + 37%|█████████████████████████████████████████████████████▎ | 179/483 [06:31<05:57, 1.18s/it] [2024-04-18 17:29:21] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.35.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 37%|█████████████████████████████████████████████████████▎ | 179/483 [06:42<05:57, 1.18s/it] 37%|█████████████████████████████████████████████████████▋ | 180/483 [06:42<18:38, 3.69s/it] [2024-04-18 17:29:23] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.35.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 37%|█████████████████████████████████████████████████████▋ | 180/483 [06:43<18:38, 3.69s/it] [2024-04-18 17:29:23] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.35.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 37%|█████████████████████████████████████████████████████▋ | 180/483 [06:43<18:38, 3.69s/it] 37%|█████████████████████████████████████████████████████▉ | 181/483 [06:43<15:38, 3.11s/it] [2024-04-18 17:29:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.35.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 37%|█████████████████████████████████████████████████████▉ | 181/483 [06:47<15:38, 3.11s/it] [2024-04-18 17:29:28] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.35.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 37%|█████████████████████████████████████████████████████▉ | 181/483 [06:48<15:38, 3.11s/it] 38%|██████████████████████████████████████████████████████▎ | 182/483 [06:48<18:21, 3.66s/it] [2024-04-18 17:29:28] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.35.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 38%|██████████████████████████████████████████████████████▎ | 182/483 [06:48<18:21, 3.66s/it] [2024-04-18 17:29:28] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.35.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 38%|██████████████████████████████████████████████████████▎ | 182/483 [06:49<18:21, 3.66s/it] [2024-04-18 17:29:29] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.35.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 38%|██████████████████████████████████████████████████████▎ | 182/483 [06:49<18:21, 3.66s/it] 38%|██████████████████████████████████████████████████████▊ | 184/483 [06:49<10:48, 2.17s/it] [2024-04-18 17:29:29] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.36.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 38%|██████████████████████████████████████████████████████▊ | 184/483 [06:49<10:48, 2.17s/it] [2024-04-18 17:29:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.36.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 38%|██████████████████████████████████████████████████████▊ | 184/483 [06:50<10:48, 2.17s/it] [2024-04-18 17:29:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.36.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 38%|██████████████████████████████████████████████████████▊ | 184/483 [06:50<10:48, 2.17s/it] 39%|███████████████████████████████████████████████████████▍ | 186/483 [06:50<07:56, 1.61s/it] [2024-04-18 17:29:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.36.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 39%|███████████████████████████████████████████████████████▍ | 186/483 [06:54<07:56, 1.61s/it] [2024-04-18 17:29:35] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.36.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 39%|███████████████████████████████████████████████████████▍ | 186/483 [06:55<07:56, 1.61s/it] 39%|███████████████████████████████████████████████████████▊ | 187/483 [06:55<11:36, 2.35s/it] [2024-04-18 17:29:35] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.36.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 39%|███████████████████████████████████████████████████████▊ | 187/483 [06:55<11:36, 2.35s/it] [2024-04-18 17:29:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.36.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 39%|███████████████████████████████████████████████████████▊ | 187/483 [06:56<11:36, 2.35s/it] [2024-04-18 17:29:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.36.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 39%|███████████████████████████████████████████████████████▊ | 187/483 [06:56<11:36, 2.35s/it] 39%|████████████████████████████████████████████████████████▎ | 189/483 [06:56<07:53, 1.61s/it] [2024-04-18 17:29:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.36.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 39%|████████████████████████████████████████████████████████▎ | 189/483 [06:56<07:53, 1.61s/it] [2024-04-18 17:29:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.36.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 39%|████████████████████████████████████████████████████████▎ | 189/483 [06:56<07:53, 1.61s/it] 39%|████████████████████████████████████████████████████████▋ | 190/483 [06:56<06:37, 1.36s/it] [2024-04-18 17:29:36] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.37.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 39%|████████████████████████████████████████████████████████▋ | 190/483 [06:56<06:37, 1.36s/it] [2024-04-18 17:29:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.37.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 39%|████████████████████████████████████████████████████████▋ | 190/483 [06:58<06:37, 1.36s/it] [2024-04-18 17:29:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.37.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 39%|████████████████████████████████████████████████████████▋ | 190/483 [06:58<06:37, 1.36s/it] 40%|█████████████████████████████████████████████████████████▏ | 192/483 [06:58<05:28, 1.13s/it] [2024-04-18 17:29:41] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.37.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 40%|█████████████████████████████████████████████████████████▏ | 192/483 [07:02<05:28, 1.13s/it] [2024-04-18 17:29:42] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.37.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 40%|█████████████████████████████████████████████████████████▏ | 192/483 [07:03<05:28, 1.13s/it] 40%|█████████████████████████████████████████████████████████▌ | 193/483 [07:03<09:03, 1.87s/it] [2024-04-18 17:29:42] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.37.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 40%|█████████████████████████████████████████████████████████▌ | 193/483 [07:03<09:03, 1.87s/it] [2024-04-18 17:29:43] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.37.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 40%|█████████████████████████████████████████████████████████▌ | 193/483 [07:03<09:03, 1.87s/it] [2024-04-18 17:29:43] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.37.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 40%|█████████████████████████████████████████████████████████▌ | 193/483 [07:03<09:03, 1.87s/it] 40%|██████████████████████████████████████████████████████████▏ | 195/483 [07:04<06:23, 1.33s/it] [2024-04-18 17:29:44] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.37.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 40%|██████████████████████████████████████████████████████████▏ | 195/483 [07:04<06:23, 1.33s/it] [2024-04-18 17:29:44] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.37.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 40%|██████████████████████████████████████████████████████████▏ | 195/483 [07:04<06:23, 1.33s/it] 41%|██████████████████████████████████████████████████████████▍ | 196/483 [07:04<05:23, 1.13s/it] [2024-04-18 17:29:44] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00014-of-00030.safetensors + 41%|██████████████████████████████████████████████████████████▍ | 196/483 [07:04<05:23, 1.13s/it] [2024-04-18 17:29:44] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00015-of-00030.safetensors + 41%|██████████████████████████████████████████████████████████▍ | 196/483 [07:04<05:23, 1.13s/it] [2024-04-18 17:29:53] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.38.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 41%|██████████████████████████████████████████████████████████▍ | 196/483 [07:13<05:23, 1.13s/it] 41%|██████████████████████████████████████████████████████████▋ | 197/483 [07:13<14:35, 3.06s/it] [2024-04-18 17:29:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.38.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 41%|██████████████████████████████████████████████████████████▋ | 197/483 [07:14<14:35, 3.06s/it] [2024-04-18 17:29:55] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.38.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 41%|██████████████████████████████████████████████████████████▋ | 197/483 [07:15<14:35, 3.06s/it] 41%|███████████████████████████████████████████████████████████ | 198/483 [07:15<12:42, 2.68s/it] [2024-04-18 17:29:59] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.38.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 41%|███████████████████████████████████████████████████████████ | 198/483 [07:19<12:42, 2.68s/it] [2024-04-18 17:30:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.38.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 41%|███████████████████████████████████████████████████████████ | 198/483 [07:20<12:42, 2.68s/it] 41%|███████████████████████████████████████████████████████████▎ | 199/483 [07:20<15:58, 3.38s/it] [2024-04-18 17:30:00] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.38.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 41%|███████████████████████████████████████████████████████████▎ | 199/483 [07:20<15:58, 3.38s/it] [2024-04-18 17:30:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.38.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 41%|███████████████████████████████████████████████████████████▎ | 199/483 [07:21<15:58, 3.38s/it] [2024-04-18 17:30:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.38.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 41%|███████████████████████████████████████████████████████████▎ | 199/483 [07:21<15:58, 3.38s/it] 42%|███████████████████████████████████████████████████████████▉ | 201/483 [07:21<10:02, 2.14s/it] [2024-04-18 17:30:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.38.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 42%|███████████████████████████████████████████████████████████▉ | 201/483 [07:21<10:02, 2.14s/it] [2024-04-18 17:30:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.38.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 42%|███████████████████████████████████████████████████████████▉ | 201/483 [07:22<10:02, 2.14s/it] 42%|████████████████████████████████████████████████████████████▏ | 202/483 [07:22<08:09, 1.74s/it] [2024-04-18 17:30:01] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.39.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 42%|████████████████████████████████████████████████████████████▏ | 202/483 [07:22<08:09, 1.74s/it] [2024-04-18 17:30:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.39.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 42%|████████████████████████████████████████████████████████████▏ | 202/483 [07:23<08:09, 1.74s/it] [2024-04-18 17:30:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.39.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 42%|████████████████████████████████████████████████████████████▏ | 202/483 [07:23<08:09, 1.74s/it] 42%|████████████████████████████████████████████████████████████▊ | 204/483 [07:23<06:16, 1.35s/it] [2024-04-18 17:30:07] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.39.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 42%|████████████████████████████████████████████████████████████▊ | 204/483 [07:27<06:16, 1.35s/it] [2024-04-18 17:30:08] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.39.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 42%|████████████████████████████████████████████████████████████▊ | 204/483 [07:28<06:16, 1.35s/it] 42%|█████████████████████████████████████████████████████████████ | 205/483 [07:28<10:04, 2.17s/it] [2024-04-18 17:30:08] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.39.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 42%|█████████████████████████████████████████████████████████████ | 205/483 [07:28<10:04, 2.17s/it] [2024-04-18 17:30:09] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.39.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 42%|█████████████████████████████████████████████████████████████ | 205/483 [07:29<10:04, 2.17s/it] [2024-04-18 17:30:09] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.39.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 42%|█████████████████████████████████████████████████████████████ | 205/483 [07:29<10:04, 2.17s/it] 43%|█████████████████████████████████████████████████████████████▋ | 207/483 [07:29<07:17, 1.58s/it] [2024-04-18 17:30:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.39.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 43%|█████████████████████████████████████████████████████████████▋ | 207/483 [07:30<07:17, 1.58s/it] [2024-04-18 17:30:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.39.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 43%|█████████████████████████████████████████████████████████████▋ | 207/483 [07:30<07:17, 1.58s/it] 43%|██████████████████████████████████████████████████████████████ | 208/483 [07:30<06:08, 1.34s/it] [2024-04-18 17:30:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.40.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 43%|██████████████████████████████████████████████████████████████ | 208/483 [07:33<06:08, 1.34s/it] [2024-04-18 17:30:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.40.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 43%|██████████████████████████████████████████████████████████████ | 208/483 [07:34<06:08, 1.34s/it] 43%|██████████████████████████████████████████████████████████████▎ | 209/483 [07:34<09:25, 2.06s/it] [2024-04-18 17:30:15] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.40.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 43%|██████████████████████████████████████████████████████████████▎ | 209/483 [07:35<09:25, 2.06s/it] [2024-04-18 17:30:15] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.40.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 43%|██████████████████████████████████████████████████████████████▎ | 209/483 [07:35<09:25, 2.06s/it] 43%|██████████████████████████████████████████████████████████████▌ | 210/483 [07:35<08:00, 1.76s/it] [2024-04-18 17:30:15] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.40.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 43%|██████████████████████████████████████████████████████████████▌ | 210/483 [07:36<08:00, 1.76s/it] [2024-04-18 17:30:16] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.40.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 43%|██████████████████████████████████████████████████████████████▌ | 210/483 [07:36<08:00, 1.76s/it] 44%|██████████████████████████████████████████████████████████████▉ | 211/483 [07:36<06:34, 1.45s/it] [2024-04-18 17:30:16] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00015-of-00030.safetensors + 44%|██████████████████████████████████████████████████████████████▉ | 211/483 [07:36<06:34, 1.45s/it] [2024-04-18 17:30:16] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00003-of-00030.safetensors + 44%|██████████████████████████████████████████████████████████████▉ | 211/483 [07:36<06:34, 1.45s/it] [2024-04-18 17:30:26] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.4.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 44%|██████████████████████████████████████████████████████████████▉ | 211/483 [07:46<06:34, 1.45s/it] 44%|███████████████████████████████████████████████████████████████▏ | 212/483 [07:46<17:10, 3.80s/it] [2024-04-18 17:30:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.4.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 44%|███████████████████████████████████████████████████████████████▏ | 212/483 [07:47<17:10, 3.80s/it] [2024-04-18 17:30:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.4.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 44%|███████████████████████████████████████████████████████████████▏ | 212/483 [07:47<17:10, 3.80s/it] 44%|███████████████████████████████████████████████████████████████▌ | 213/483 [07:47<14:20, 3.19s/it] [2024-04-18 17:30:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.4.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 44%|███████████████████████████████████████████████████████████████▌ | 213/483 [07:51<14:20, 3.19s/it] [2024-04-18 17:30:32] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.4.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 44%|███████████████████████████████████████████████████████████████▌ | 213/483 [07:52<14:20, 3.19s/it] 44%|███████████████████████████████████████████████████████████████▊ | 214/483 [07:52<16:39, 3.72s/it] [2024-04-18 17:30:32] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.4.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 44%|███████████████████████████████████████████████████████████████▊ | 214/483 [07:52<16:39, 3.72s/it] [2024-04-18 17:30:32] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.5.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 44%|███████████████████████████████████████████████████████████████▊ | 214/483 [07:52<16:39, 3.72s/it] [2024-04-18 17:30:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.5.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 44%|███████████████████████████████████████████████████████████████▊ | 214/483 [07:54<16:39, 3.72s/it] [2024-04-18 17:30:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.5.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 44%|███████████████████████████████████████████████████████████████▊ | 214/483 [07:54<16:39, 3.72s/it] 45%|████████████████████████████████████████████████████████████████▋ | 217/483 [07:54<08:51, 2.00s/it] [2024-04-18 17:30:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.5.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 45%|████████████████████████████████████████████████████████████████▋ | 217/483 [07:59<08:51, 2.00s/it] [2024-04-18 17:30:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.5.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 45%|████████████████████████████████████████████████████████████████▋ | 217/483 [08:00<08:51, 2.00s/it] 45%|████████████████████████████████████████████████████████████████▉ | 218/483 [08:00<12:13, 2.77s/it] [2024-04-18 17:30:40] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.5.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 45%|████████████████████████████████████████████████████████████████▉ | 218/483 [08:00<12:13, 2.77s/it] [2024-04-18 17:30:41] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.5.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 45%|████████████████████████████████████████████████████████████████▉ | 218/483 [08:01<12:13, 2.77s/it] [2024-04-18 17:30:41] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.5.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 45%|████████████████████████████████████████████████████████████████▉ | 218/483 [08:02<12:13, 2.77s/it] 46%|█████████████████████████████████████████████████████████████████▌ | 220/483 [08:02<08:54, 2.03s/it] [2024-04-18 17:30:42] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.5.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 46%|█████████████████████████████████████████████████████████████████▌ | 220/483 [08:02<08:54, 2.03s/it] [2024-04-18 17:30:42] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.5.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 46%|█████████████████████████████████████████████████████████████████▌ | 220/483 [08:02<08:54, 2.03s/it] 46%|█████████████████████████████████████████████████████████████████▉ | 221/483 [08:02<07:23, 1.69s/it] [2024-04-18 17:30:42] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.6.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 46%|█████████████████████████████████████████████████████████████████▉ | 221/483 [08:02<07:23, 1.69s/it] [2024-04-18 17:30:43] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.6.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 46%|█████████████████████████████████████████████████████████████████▉ | 221/483 [08:03<07:23, 1.69s/it] [2024-04-18 17:30:43] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.6.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 46%|█████████████████████████████████████████████████████████████████▉ | 221/483 [08:03<07:23, 1.69s/it] 46%|██████████████████████████████████████████████████████████████████▍ | 223/483 [08:03<05:44, 1.32s/it] [2024-04-18 17:30:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.6.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 46%|██████████████████████████████████████████████████████████████████▍ | 223/483 [08:08<05:44, 1.32s/it] [2024-04-18 17:30:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.6.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 46%|██████████████████████████████████████████████████████████████████▍ | 223/483 [08:09<05:44, 1.32s/it] 46%|██████████████████████████████████████████████████████████████████▊ | 224/483 [08:09<09:27, 2.19s/it] [2024-04-18 17:30:49] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.6.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 46%|██████████████████████████████████████████████████████████████████▊ | 224/483 [08:09<09:27, 2.19s/it] [2024-04-18 17:30:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.6.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 46%|██████████████████████████████████████████████████████████████████▊ | 224/483 [08:09<09:27, 2.19s/it] [2024-04-18 17:30:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.6.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 46%|██████████████████████████████████████████████████████████████████▊ | 224/483 [08:09<09:27, 2.19s/it] 47%|███████████████████████████████████████████████████████████████████▍ | 226/483 [08:09<06:22, 1.49s/it] [2024-04-18 17:30:50] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.6.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 47%|███████████████████████████████████████████████████████████████████▍ | 226/483 [08:10<06:22, 1.49s/it] [2024-04-18 17:30:50] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.6.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 47%|███████████████████████████████████████████████████████████████████▍ | 226/483 [08:10<06:22, 1.49s/it] 47%|███████████████████████████████████████████████████████████████████▋ | 227/483 [08:10<05:21, 1.26s/it] [2024-04-18 17:30:50] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.7.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 47%|███████████████████████████████████████████████████████████████████▋ | 227/483 [08:11<05:21, 1.26s/it] [2024-04-18 17:30:50] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.7.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 47%|███████████████████████████████████████████████████████████████████▋ | 227/483 [08:11<05:21, 1.26s/it] 47%|███████████████████████████████████████████████████████████████████▉ | 228/483 [08:11<04:52, 1.15s/it] [2024-04-18 17:30:50] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00003-of-00030.safetensors + 47%|███████████████████████████████████████████████████████████████████▉ | 228/483 [08:11<04:52, 1.15s/it] [2024-04-18 17:30:51] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00016-of-00030.safetensors + 47%|███████████████████████████████████████████████████████████████████▉ | 228/483 [08:11<04:52, 1.15s/it] [2024-04-18 17:31:00] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.40.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 47%|███████████████████████████████████████████████████████████████████▉ | 228/483 [08:20<04:52, 1.15s/it] 47%|████████████████████████████████████████████████████████████████████▎ | 229/483 [08:20<13:53, 3.28s/it] [2024-04-18 17:31:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.40.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 47%|████████████████████████████████████████████████████████████████████▎ | 229/483 [08:22<13:53, 3.28s/it] [2024-04-18 17:31:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.40.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 47%|████████████████████████████████████████████████████████████████████▎ | 229/483 [08:22<13:53, 3.28s/it] 48%|████████████████████████████████████████████████████████████████████▌ | 230/483 [08:22<12:04, 2.86s/it] [2024-04-18 17:31:02] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.40.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 48%|████████████████████████████████████████████████████████████████████▌ | 230/483 [08:22<12:04, 2.86s/it] [2024-04-18 17:31:02] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.41.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 48%|████████████████████████████████████████████████████████████████████▌ | 230/483 [08:22<12:04, 2.86s/it] [2024-04-18 17:31:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.41.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 48%|████████████████████████████████████████████████████████████████████▌ | 230/483 [08:23<12:04, 2.86s/it] [2024-04-18 17:31:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.41.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 48%|████████████████████████████████████████████████████████████████████▌ | 230/483 [08:24<12:04, 2.86s/it] 48%|█████████████████████████████████████████████████████████████████████▍ | 233/483 [08:24<06:46, 1.62s/it] [2024-04-18 17:31:07] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.41.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 48%|█████████████████████████████████████████████████████████████████████▍ | 233/483 [08:28<06:46, 1.62s/it] [2024-04-18 17:31:08] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.41.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 48%|█████████████████████████████████████████████████████████████████████▍ | 233/483 [08:29<06:46, 1.62s/it] 48%|█████████████████████████████████████████████████████████████████████▊ | 234/483 [08:29<09:42, 2.34s/it] [2024-04-18 17:31:09] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.41.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 48%|█████████████████████████████████████████████████████████████████████▊ | 234/483 [08:29<09:42, 2.34s/it] [2024-04-18 17:31:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.41.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 48%|█████████████████████████████████████████████████████████████████████▊ | 234/483 [08:30<09:42, 2.34s/it] [2024-04-18 17:31:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.41.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 48%|█████████████████████████████████████████████████████████████████████▊ | 234/483 [08:30<09:42, 2.34s/it] 49%|██████████████████████████████████████████████████████████████████████▎ | 236/483 [08:30<07:17, 1.77s/it] [2024-04-18 17:31:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.41.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 49%|██████████████████████████████████████████████████████████████████████▎ | 236/483 [08:31<07:17, 1.77s/it] [2024-04-18 17:31:11] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.41.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 49%|██████████████████████████████████████████████████████████████████████▎ | 236/483 [08:31<07:17, 1.77s/it] 49%|██████████████████████████████████████████████████████████████████████▋ | 237/483 [08:31<06:06, 1.49s/it] [2024-04-18 17:31:11] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.42.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 49%|██████████████████████████████████████████████████████████████████████▋ | 237/483 [08:31<06:06, 1.49s/it] [2024-04-18 17:31:12] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.42.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 49%|██████████████████████████████████████████████████████████████████████▋ | 237/483 [08:32<06:06, 1.49s/it] [2024-04-18 17:31:12] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.42.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 49%|██████████████████████████████████████████████████████████████████████▋ | 237/483 [08:33<06:06, 1.49s/it] 49%|███████████████████████████████████████████████████████████████████████▎ | 239/483 [08:33<05:14, 1.29s/it] [2024-04-18 17:31:17] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.42.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 49%|███████████████████████████████████████████████████████████████████████▎ | 239/483 [08:38<05:14, 1.29s/it] [2024-04-18 17:31:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.42.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 49%|███████████████████████████████████████████████████████████████████████▎ | 239/483 [08:38<05:14, 1.29s/it] 50%|███████████████████████████████████████████████████████████████████████▌ | 240/483 [08:38<08:59, 2.22s/it] [2024-04-18 17:31:18] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.42.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 50%|███████████████████████████████████████████████████████████████████████▌ | 240/483 [08:38<08:59, 2.22s/it] [2024-04-18 17:31:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.42.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 50%|███████████████████████████████████████████████████████████████████████▌ | 240/483 [08:39<08:59, 2.22s/it] [2024-04-18 17:31:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.42.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 50%|███████████████████████████████████████████████████████████████████████▌ | 240/483 [08:39<08:59, 2.22s/it] 50%|████████████████████████████████████████████████████████████████████████▏ | 242/483 [08:39<06:19, 1.57s/it] [2024-04-18 17:31:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.42.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 50%|████████████████████████████████████████████████████████████████████████▏ | 242/483 [08:40<06:19, 1.57s/it] [2024-04-18 17:31:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.42.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 50%|████████████████████████████████████████████████████████████████████████▏ | 242/483 [08:40<06:19, 1.57s/it] 50%|████████████████████████████████████████████████████████████████████████▍ | 243/483 [08:40<05:20, 1.34s/it] [2024-04-18 17:31:20] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00017-of-00030.safetensors + 50%|████████████████████████████████████████████████████████████████████████▍ | 243/483 [08:40<05:20, 1.34s/it] [2024-04-18 17:31:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.43.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 50%|████████████████████████████████████████████████████████████████████████▍ | 243/483 [08:54<05:20, 1.34s/it] [2024-04-18 17:31:35] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.43.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 50%|████████████████████████████████████████████████████████████████████████▍ | 243/483 [08:55<05:20, 1.34s/it] 51%|████████████████████████████████████████████████████████████████████████▋ | 244/483 [08:55<17:56, 4.50s/it] [2024-04-18 17:31:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.43.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 51%|████████████████████████████████████████████████████████████████████████▋ | 244/483 [08:56<17:56, 4.50s/it] [2024-04-18 17:31:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.43.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 51%|████████████████████████████████████████████████████████████████████████▋ | 244/483 [08:56<17:56, 4.50s/it] 51%|█████████████████████████████████████████████████████████████████████████ | 245/483 [08:56<14:36, 3.68s/it] [2024-04-18 17:31:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.43.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 51%|█████████████████████████████████████████████████████████████████████████ | 245/483 [08:56<14:36, 3.68s/it] [2024-04-18 17:31:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.43.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 51%|█████████████████████████████████████████████████████████████████████████ | 245/483 [08:56<14:36, 3.68s/it] 51%|█████████████████████████████████████████████████████████████████████████▎ | 246/483 [08:56<11:05, 2.81s/it] [2024-04-18 17:31:36] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.43.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 51%|█████████████████████████████████████████████████████████████████████████▎ | 246/483 [08:56<11:05, 2.81s/it] [2024-04-18 17:31:37] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.43.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 51%|█████████████████████████████████████████████████████████████████████████▎ | 246/483 [08:58<11:05, 2.81s/it] [2024-04-18 17:31:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.43.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 51%|█████████████████████████████████████████████████████████████████████████▎ | 246/483 [08:58<11:05, 2.81s/it] 51%|█████████████████████████████████████████████████████████████████████████▉ | 248/483 [08:58<07:33, 1.93s/it] [2024-04-18 17:31:38] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.43.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 51%|█████████████████████████████████████████████████████████████████████████▉ | 248/483 [08:58<07:33, 1.93s/it] [2024-04-18 17:31:38] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.44.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 51%|█████████████████████████████████████████████████████████████████████████▉ | 248/483 [08:58<07:33, 1.93s/it] [2024-04-18 17:31:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.44.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 51%|█████████████████████████████████████████████████████████████████████████▉ | 248/483 [08:59<07:33, 1.93s/it] [2024-04-18 17:31:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.44.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 51%|█████████████████████████████████████████████████████████████████████████▉ | 248/483 [08:59<07:33, 1.93s/it] 52%|██████████████████████████████████████████████████████████████████████████▊ | 251/483 [08:59<04:45, 1.23s/it] [2024-04-18 17:31:43] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.44.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 52%|██████████████████████████████████████████████████████████████████████████▊ | 251/483 [09:03<04:45, 1.23s/it] [2024-04-18 17:31:44] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.44.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 52%|██████████████████████████████████████████████████████████████████████████▊ | 251/483 [09:04<04:45, 1.23s/it] 52%|███████████████████████████████████████████████████████████████████████████▏ | 252/483 [09:04<07:13, 1.88s/it] [2024-04-18 17:31:44] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.44.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 52%|███████████████████████████████████████████████████████████████████████████▏ | 252/483 [09:04<07:13, 1.88s/it] [2024-04-18 17:31:44] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.44.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 52%|███████████████████████████████████████████████████████████████████████████▏ | 252/483 [09:05<07:13, 1.88s/it] [2024-04-18 17:31:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.44.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 52%|███████████████████████████████████████████████████████████████████████████▏ | 252/483 [09:05<07:13, 1.88s/it] 53%|███████████████████████████████████████████████████████████████████████████▋ | 254/483 [09:05<05:11, 1.36s/it] [2024-04-18 17:31:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.44.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 53%|███████████████████████████████████████████████████████████████████████████▋ | 254/483 [09:05<05:11, 1.36s/it] [2024-04-18 17:31:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.44.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 53%|███████████████████████████████████████████████████████████████████████████▋ | 254/483 [09:05<05:11, 1.36s/it] 53%|████████████████████████████████████████████████████████████████████████████ | 255/483 [09:05<04:24, 1.16s/it] [2024-04-18 17:31:45] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.45.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 53%|████████████████████████████████████████████████████████████████████████████ | 255/483 [09:05<04:24, 1.16s/it] [2024-04-18 17:31:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.45.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 53%|████████████████████████████████████████████████████████████████████████████ | 255/483 [09:06<04:24, 1.16s/it] [2024-04-18 17:31:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.45.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 53%|████████████████████████████████████████████████████████████████████████████ | 255/483 [09:07<04:24, 1.16s/it] 53%|████████████████████████████████████████████████████████████████████████████▌ | 257/483 [09:07<03:49, 1.01s/it] [2024-04-18 17:31:50] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.45.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 53%|████████████████████████████████████████████████████████████████████████████▌ | 257/483 [09:11<03:49, 1.01s/it] [2024-04-18 17:31:51] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.45.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 53%|████████████████████████████████████████████████████████████████████████████▌ | 257/483 [09:11<03:49, 1.01s/it] 53%|████████████████████████████████████████████████████████████████████████████▉ | 258/483 [09:11<06:35, 1.76s/it] [2024-04-18 17:31:51] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.45.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 53%|████████████████████████████████████████████████████████████████████████████▉ | 258/483 [09:11<06:35, 1.76s/it] [2024-04-18 17:31:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.45.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 53%|████████████████████████████████████████████████████████████████████████████▉ | 258/483 [09:12<06:35, 1.76s/it] [2024-04-18 17:31:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.45.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 53%|████████████████████████████████████████████████████████████████████████████▉ | 258/483 [09:12<06:35, 1.76s/it] 54%|█████████████████████████████████████████████████████████████████████████████▌ | 260/483 [09:12<04:37, 1.24s/it] [2024-04-18 17:31:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.45.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 54%|█████████████████████████████████████████████████████████████████████████████▌ | 260/483 [09:12<04:37, 1.24s/it] [2024-04-18 17:31:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.45.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 54%|█████████████████████████████████████████████████████████████████████████████▌ | 260/483 [09:12<04:37, 1.24s/it] 54%|█████████████████████████████████████████████████████████████████████████████▊ | 261/483 [09:12<03:54, 1.05s/it] [2024-04-18 17:31:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.46.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 54%|█████████████████████████████████████████████████████████████████████████████▊ | 261/483 [09:13<03:54, 1.05s/it] [2024-04-18 17:31:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.46.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 54%|█████████████████████████████████████████████████████████████████████████████▊ | 261/483 [09:13<03:54, 1.05s/it] 54%|██████████████████████████████████████████████████████████████████████████████ | 262/483 [09:13<03:38, 1.01it/s] [2024-04-18 17:31:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.46.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 54%|██████████████████████████████████████████████████████████████████████████████ | 262/483 [09:13<03:38, 1.01it/s] [2024-04-18 17:31:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.46.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 54%|██████████████████████████████████████████████████████████████████████████████ | 262/483 [09:13<03:38, 1.01it/s] 54%|██████████████████████████████████████████████████████████████████████████████▍ | 263/483 [09:13<03:02, 1.21it/s] [2024-04-18 17:31:53] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00016-of-00030.safetensors + 54%|██████████████████████████████████████████████████████████████████████████████▍ | 263/483 [09:13<03:02, 1.21it/s] [2024-04-18 17:31:54] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00017-of-00030.safetensors + 54%|██████████████████████████████████████████████████████████████████████████████▍ | 263/483 [09:14<03:02, 1.21it/s] [2024-04-18 17:31:54] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00018-of-00030.safetensors + 54%|██████████████████████████████████████████████████████████████████████████████▍ | 263/483 [09:14<03:02, 1.21it/s] [2024-04-18 17:32:04] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.46.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 54%|██████████████████████████████████████████████████████████████████████████████▍ | 263/483 [09:24<03:02, 1.21it/s] 55%|██████████████████████████████████████████████████████████████████████████████▋ | 264/483 [09:24<12:29, 3.42s/it] [2024-04-18 17:32:06] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.46.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 55%|██████████████████████████████████████████████████████████████████████████████▋ | 264/483 [09:26<12:29, 3.42s/it] [2024-04-18 17:32:06] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.46.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 55%|██████████████████████████████████████████████████████████████████████████████▋ | 264/483 [09:26<12:29, 3.42s/it] 55%|███████████████████████████████████████████████████████████████████████████████ | 265/483 [09:26<11:05, 3.05s/it] [2024-04-18 17:32:12] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.46.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 55%|███████████████████████████████████████████████████████████████████████████████ | 265/483 [09:32<11:05, 3.05s/it] [2024-04-18 17:32:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.46.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 55%|███████████████████████████████████████████████████████████████████████████████ | 265/483 [09:33<11:05, 3.05s/it] 55%|███████████████████████████████████████████████████████████████████████████████▎ | 266/483 [09:33<14:33, 4.02s/it] [2024-04-18 17:32:13] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.46.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 55%|███████████████████████████████████████████████████████████████████████████████▎ | 266/483 [09:33<14:33, 4.02s/it] [2024-04-18 17:32:13] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.47.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 55%|███████████████████████████████████████████████████████████████████████████████▎ | 266/483 [09:33<14:33, 4.02s/it] [2024-04-18 17:32:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.47.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 55%|███████████████████████████████████████████████████████████████████████████████▎ | 266/483 [09:34<14:33, 4.02s/it] [2024-04-18 17:32:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.47.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 55%|███████████████████████████████████████████████████████████████████████████████▎ | 266/483 [09:34<14:33, 4.02s/it] 56%|████████████████████████████████████████████████████████████████████████████████▏ | 269/483 [09:34<07:35, 2.13s/it] [2024-04-18 17:32:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.47.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 56%|████████████████████████████████████████████████████████████████████████████████▏ | 269/483 [09:39<07:35, 2.13s/it] [2024-04-18 17:32:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.47.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 56%|████████████████████████████████████████████████████████████████████████████████▏ | 269/483 [09:40<07:35, 2.13s/it] 56%|████████████████████████████████████████████████████████████████████████████████▍ | 270/483 [09:40<09:55, 2.80s/it] [2024-04-18 17:32:20] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.47.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 56%|████████████████████████████████████████████████████████████████████████████████▍ | 270/483 [09:40<09:55, 2.80s/it] [2024-04-18 17:32:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.47.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 56%|████████████████████████████████████████████████████████████████████████████████▍ | 270/483 [09:41<09:55, 2.80s/it] [2024-04-18 17:32:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.47.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 56%|████████████████████████████████████████████████████████████████████████████████▍ | 270/483 [09:41<09:55, 2.80s/it] 56%|█████████████████████████████████████████████████████████████████████████████████ | 272/483 [09:41<06:47, 1.93s/it] [2024-04-18 17:32:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.47.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 56%|█████████████████████████████████████████████████████████████████████████████████ | 272/483 [09:41<06:47, 1.93s/it] [2024-04-18 17:32:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.47.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 56%|█████████████████████████████████████████████████████████████████████████████████ | 272/483 [09:41<06:47, 1.93s/it] 57%|█████████████████████████████████████████████████████████████████████████████████▍ | 273/483 [09:41<05:35, 1.60s/it] [2024-04-18 17:32:21] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.48.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 57%|█████████████████████████████████████████████████████████████████████████████████▍ | 273/483 [09:41<05:35, 1.60s/it] [2024-04-18 17:32:22] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.48.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 57%|█████████████████████████████████████████████████████████████████████████████████▍ | 273/483 [09:42<05:35, 1.60s/it] [2024-04-18 17:32:22] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.48.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 57%|█████████████████████████████████████████████████████████████████████████████████▍ | 273/483 [09:43<05:35, 1.60s/it] 57%|█████████████████████████████████████████████████████████████████████████████████▉ | 275/483 [09:43<04:28, 1.29s/it] [2024-04-18 17:32:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.48.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 57%|█████████████████████████████████████████████████████████████████████████████████▉ | 275/483 [09:48<04:28, 1.29s/it] [2024-04-18 17:32:28] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.48.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 57%|█████████████████████████████████████████████████████████████████████████████████▉ | 275/483 [09:48<04:28, 1.29s/it] 57%|██████████████████████████████████████████████████████████████████████████████████▎ | 276/483 [09:48<07:29, 2.17s/it] [2024-04-18 17:32:28] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.48.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 57%|██████████████████████████████████████████████████████████████████████████████████▎ | 276/483 [09:48<07:29, 2.17s/it] [2024-04-18 17:32:29] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.48.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 57%|██████████████████████████████████████████████████████████████████████████████████▎ | 276/483 [09:49<07:29, 2.17s/it] [2024-04-18 17:32:29] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.48.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 57%|██████████████████████████████████████████████████████████████████████████████████▎ | 276/483 [09:49<07:29, 2.17s/it] 58%|██████████████████████████████████████████████████████████████████████████████████▉ | 278/483 [09:49<05:09, 1.51s/it] [2024-04-18 17:32:29] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.48.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 58%|██████████████████████████████████████████████████████████████████████████████████▉ | 278/483 [09:49<05:09, 1.51s/it] [2024-04-18 17:32:29] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.48.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 58%|██████████████████████████████████████████████████████████████████████████████████▉ | 278/483 [09:49<05:09, 1.51s/it] 58%|███████████████████████████████████████████████████████████████████████████████████▏ | 279/483 [09:49<04:17, 1.26s/it] [2024-04-18 17:32:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.49.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 58%|███████████████████████████████████████████████████████████████████████████████████▏ | 279/483 [09:50<04:17, 1.26s/it] [2024-04-18 17:32:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.49.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 58%|███████████████████████████████████████████████████████████████████████████████████▏ | 279/483 [09:50<04:17, 1.26s/it] 58%|███████████████████████████████████████████████████████████████████████████████████▍ | 280/483 [09:50<03:42, 1.10s/it] [2024-04-18 17:32:30] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00018-of-00030.safetensors + 58%|███████████████████████████████████████████████████████████████████████████████████▍ | 280/483 [09:50<03:42, 1.10s/it] [2024-04-18 17:32:30] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00019-of-00030.safetensors + 58%|███████████████████████████████████████████████████████████████████████████████████▍ | 280/483 [09:50<03:42, 1.10s/it] [2024-04-18 17:32:39] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.49.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 58%|███████████████████████████████████████████████████████████████████████████████████▍ | 280/483 [10:00<03:42, 1.10s/it] 58%|███████████████████████████████████████████████████████████████████████████████████▊ | 281/483 [10:00<11:04, 3.29s/it] [2024-04-18 17:32:41] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.49.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 58%|███████████████████████████████████████████████████████████████████████████████████▊ | 281/483 [10:01<11:04, 3.29s/it] [2024-04-18 17:32:41] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.49.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 58%|███████████████████████████████████████████████████████████████████████████████████▊ | 281/483 [10:01<11:04, 3.29s/it] 58%|████████████████████████████████████████████████████████████████████████████████████ | 282/483 [10:01<09:33, 2.85s/it] [2024-04-18 17:32:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.49.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 58%|████████████████████████████████████████████████████████████████████████████████████ | 282/483 [10:06<09:33, 2.85s/it] [2024-04-18 17:32:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.49.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 58%|████████████████████████████████████████████████████████████████████████████████████ | 282/483 [10:07<09:33, 2.85s/it] 59%|████████████████████████████████████████████████████████████████████████████████████▎ | 283/483 [10:07<11:42, 3.51s/it] [2024-04-18 17:32:46] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.49.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 59%|████████████████████████████████████████████████████████████████████████████████████▎ | 283/483 [10:07<11:42, 3.51s/it] [2024-04-18 17:32:47] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.49.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 59%|████████████████████████████████████████████████████████████████████████████████████▎ | 283/483 [10:07<11:42, 3.51s/it] [2024-04-18 17:32:47] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.49.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 59%|████████████████████████████████████████████████████████████████████████████████████▎ | 283/483 [10:07<11:42, 3.51s/it] 59%|████████████████████████████████████████████████████████████████████████████████████▉ | 285/483 [10:07<06:44, 2.04s/it] [2024-04-18 17:32:47] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.50.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 59%|████████████████████████████████████████████████████████████████████████████████████▉ | 285/483 [10:07<06:44, 2.04s/it] [2024-04-18 17:32:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.50.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 59%|████████████████████████████████████████████████████████████████████████████████████▉ | 285/483 [10:08<06:44, 2.04s/it] [2024-04-18 17:32:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.50.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 59%|████████████████████████████████████████████████████████████████████████████████████▉ | 285/483 [10:09<06:44, 2.04s/it] 59%|█████████████████████████████████████████████████████████████████████████████████████▌ | 287/483 [10:09<05:08, 1.58s/it] [2024-04-18 17:32:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.50.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 59%|█████████████████████████████████████████████████████████████████████████████████████▌ | 287/483 [10:12<05:08, 1.58s/it] [2024-04-18 17:32:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.50.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 59%|█████████████████████████████████████████████████████████████████████████████████████▌ | 287/483 [10:13<05:08, 1.58s/it] 60%|█████████████████████████████████████████████████████████████████████████████████████▊ | 288/483 [10:13<07:14, 2.23s/it] [2024-04-18 17:32:53] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.50.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 60%|█████████████████████████████████████████████████████████████████████████████████████▊ | 288/483 [10:13<07:14, 2.23s/it] [2024-04-18 17:32:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.50.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 60%|█████████████████████████████████████████████████████████████████████████████████████▊ | 288/483 [10:14<07:14, 2.23s/it] [2024-04-18 17:32:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.50.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 60%|█████████████████████████████████████████████████████████████████████████████████████▊ | 288/483 [10:14<07:14, 2.23s/it] 60%|██████████████████████████████████████████████████████████████████████████████████████▍ | 290/483 [10:14<05:03, 1.57s/it] [2024-04-18 17:32:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.50.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 60%|██████████████████████████████████████████████████████████████████████████████████████▍ | 290/483 [10:14<05:03, 1.57s/it] [2024-04-18 17:32:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.50.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 60%|██████████████████████████████████████████████████████████████████████████████████████▍ | 290/483 [10:15<05:03, 1.57s/it] 60%|██████████████████████████████████████████████████████████████████████████████████████▊ | 291/483 [10:15<04:13, 1.32s/it] [2024-04-18 17:32:54] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.51.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 60%|██████████████████████████████████████████████████████████████████████████████████████▊ | 291/483 [10:15<04:13, 1.32s/it] [2024-04-18 17:32:56] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.51.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 60%|██████████████████████████████████████████████████████████████████████████████████████▊ | 291/483 [10:16<04:13, 1.32s/it] [2024-04-18 17:32:56] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.51.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 60%|██████████████████████████████████████████████████████████████████████████████████████▊ | 291/483 [10:16<04:13, 1.32s/it] 61%|███████████████████████████████████████████████████████████████████████████████████████▎ | 293/483 [10:16<03:32, 1.12s/it] [2024-04-18 17:33:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.51.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 61%|███████████████████████████████████████████████████████████████████████████████████████▎ | 293/483 [10:20<03:32, 1.12s/it] [2024-04-18 17:33:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.51.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 61%|███████████████████████████████████████████████████████████████████████████████████████▎ | 293/483 [10:21<03:32, 1.12s/it] 61%|███████████████████████████████████████████████████████████████████████████████████████▋ | 294/483 [10:21<05:46, 1.83s/it] [2024-04-18 17:33:00] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.51.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 61%|███████████████████████████████████████████████████████████████████████████████████████▋ | 294/483 [10:21<05:46, 1.83s/it] [2024-04-18 17:33:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.51.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 61%|███████████████████████████████████████████████████████████████████████████████████████▋ | 294/483 [10:21<05:46, 1.83s/it] [2024-04-18 17:33:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.51.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 61%|███████████████████████████████████████████████████████████████████████████████████████▋ | 294/483 [10:22<05:46, 1.83s/it] 61%|████████████████████████████████████████████████████████████████████████████████████████▏ | 296/483 [10:22<04:05, 1.31s/it] [2024-04-18 17:33:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.51.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 61%|████████████████████████████████████████████████████████████████████████████████████████▏ | 296/483 [10:22<04:05, 1.31s/it] [2024-04-18 17:33:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.51.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 61%|████████████████████████████████████████████████████████████████████████████████████████▏ | 296/483 [10:22<04:05, 1.31s/it] 61%|████████████████████████████████████████████████████████████████████████████████████████▌ | 297/483 [10:22<03:24, 1.10s/it] [2024-04-18 17:33:02] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00019-of-00030.safetensors + 61%|████████████████████████████████████████████████████████████████████████████████████████▌ | 297/483 [10:22<03:24, 1.10s/it] [2024-04-18 17:33:02] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00020-of-00030.safetensors + 61%|████████████████████████████████████████████████████████████████████████████████████████▌ | 297/483 [10:22<03:24, 1.10s/it] [2024-04-18 17:33:11] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.52.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 61%|████████████████████████████████████████████████████████████████████████████████████████▌ | 297/483 [10:31<03:24, 1.10s/it] 62%|████████████████████████████████████████████████████████████████████████████████████████▊ | 298/483 [10:31<09:22, 3.04s/it] [2024-04-18 17:33:12] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.52.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 62%|████████████████████████████████████████████████████████████████████████████████████████▊ | 298/483 [10:32<09:22, 3.04s/it] [2024-04-18 17:33:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.52.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 62%|████████████████████████████████████████████████████████████████████████████████████████▊ | 298/483 [10:33<09:22, 3.04s/it] 62%|█████████████████████████████████████████████████████████████████████████████████████████▏ | 299/483 [10:33<08:16, 2.70s/it] [2024-04-18 17:33:17] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.52.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 62%|█████████████████████████████████████████████████████████████████████████████████████████▏ | 299/483 [10:37<08:16, 2.70s/it] [2024-04-18 17:33:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.52.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 62%|█████████████████████████████████████████████████████████████████████████████████████████▏ | 299/483 [10:38<08:16, 2.70s/it] 62%|█████████████████████████████████████████████████████████████████████████████████████████▍ | 300/483 [10:38<10:14, 3.36s/it] [2024-04-18 17:33:18] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.52.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 62%|█████████████████████████████████████████████████████████████████████████████████████████▍ | 300/483 [10:38<10:14, 3.36s/it] [2024-04-18 17:33:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.52.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 62%|█████████████████████████████████████████████████████████████████████████████████████████▍ | 300/483 [10:39<10:14, 3.36s/it] [2024-04-18 17:33:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.52.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 62%|█████████████████████████████████████████████████████████████████████████████████████████▍ | 300/483 [10:39<10:14, 3.36s/it] 63%|██████████████████████████████████████████████████████████████████████████████████████████ | 302/483 [10:39<06:14, 2.07s/it] [2024-04-18 17:33:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.52.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 63%|██████████████████████████████████████████████████████████████████████████████████████████ | 302/483 [10:39<06:14, 2.07s/it] [2024-04-18 17:33:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.52.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 63%|██████████████████████████████████████████████████████████████████████████████████████████ | 302/483 [10:39<06:14, 2.07s/it] 63%|██████████████████████████████████████████████████████████████████████████████████████████▎ | 303/483 [10:39<04:58, 1.66s/it] [2024-04-18 17:33:19] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.53.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 63%|██████████████████████████████████████████████████████████████████████████████████████████▎ | 303/483 [10:39<04:58, 1.66s/it] [2024-04-18 17:33:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.53.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 63%|██████████████████████████████████████████████████████████████████████████████████████████▎ | 303/483 [10:40<04:58, 1.66s/it] [2024-04-18 17:33:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.53.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 63%|██████████████████████████████████████████████████████████████████████████████████████████▎ | 303/483 [10:41<04:58, 1.66s/it] 63%|██████████████████████████████████████████████████████████████████████████████████████████▉ | 305/483 [10:41<03:54, 1.32s/it] [2024-04-18 17:33:25] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.53.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 63%|██████████████████████████████████████████████████████████████████████████████████████████▉ | 305/483 [10:45<03:54, 1.32s/it] [2024-04-18 17:33:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.53.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 63%|██████████████████████████████████████████████████████████████████████████████████████████▉ | 305/483 [10:46<03:54, 1.32s/it] 63%|███████████████████████████████████████████████████████████████████████████████████████████▏ | 306/483 [10:46<06:20, 2.15s/it] [2024-04-18 17:33:26] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.53.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 63%|███████████████████████████████████████████████████████████████████████████████████████████▏ | 306/483 [10:46<06:20, 2.15s/it] [2024-04-18 17:33:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.53.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 63%|███████████████████████████████████████████████████████████████████████████████████████████▏ | 306/483 [10:47<06:20, 2.15s/it] [2024-04-18 17:33:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.53.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 63%|███████████████████████████████████████████████████████████████████████████████████████████▏ | 306/483 [10:47<06:20, 2.15s/it] 64%|███████████████████████████████████████████████████████████████████████████████████████████▊ | 308/483 [10:47<04:18, 1.48s/it] [2024-04-18 17:33:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.53.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 64%|███████████████████████████████████████████████████████████████████████████████████████████▊ | 308/483 [10:47<04:18, 1.48s/it] [2024-04-18 17:33:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.53.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 64%|███████████████████████████████████████████████████████████████████████████████████████████▊ | 308/483 [10:47<04:18, 1.48s/it] 64%|████████████████████████████████████████████████████████████████████████████████████████████ | 309/483 [10:47<03:33, 1.23s/it] [2024-04-18 17:33:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.54.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 64%|████████████████████████████████████████████████████████████████████████████████████████████ | 309/483 [10:51<03:33, 1.23s/it] [2024-04-18 17:33:32] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.54.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 64%|████████████████████████████████████████████████████████████████████████████████████████████ | 309/483 [10:52<03:33, 1.23s/it] 64%|████████████████████████████████████████████████████████████████████████████████████████████▍ | 310/483 [10:52<06:21, 2.21s/it] [2024-04-18 17:33:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.54.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 64%|████████████████████████████████████████████████████████████████████████████████████████████▍ | 310/483 [10:53<06:21, 2.21s/it] [2024-04-18 17:33:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.54.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 64%|████████████████████████████████████████████████████████████████████████████████████████████▍ | 310/483 [10:53<06:21, 2.21s/it] 64%|████████████████████████████████████████████████████████████████████████████████████████████▋ | 311/483 [10:53<05:19, 1.86s/it] [2024-04-18 17:33:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.54.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 64%|████████████████████████████████████████████████████████████████████████████████████████████▋ | 311/483 [10:54<05:19, 1.86s/it] [2024-04-18 17:33:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.54.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 64%|████████████████████████████████████████████████████████████████████████████████████████████▋ | 311/483 [10:54<05:19, 1.86s/it] 65%|█████████████████████████████████████████████████████████████████████████████████████████████ | 312/483 [10:54<04:12, 1.48s/it] [2024-04-18 17:33:33] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00020-of-00030.safetensors + 65%|█████████████████████████████████████████████████████████████████████████████████████████████ | 312/483 [10:54<04:12, 1.48s/it] [2024-04-18 17:33:34] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00021-of-00030.safetensors + 65%|█████████████████████████████████████████████████████████████████████████████████████████████ | 312/483 [10:54<04:12, 1.48s/it] [2024-04-18 17:33:43] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.54.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 65%|█████████████████████████████████████████████████████████████████████████████████████████████ | 312/483 [11:03<04:12, 1.48s/it] 65%|█████████████████████████████████████████████████████████████████████████████████████████████▎ | 313/483 [11:03<10:17, 3.63s/it] [2024-04-18 17:33:44] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.54.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 65%|█████████████████████████████████████████████████████████████████████████████████████████████▎ | 313/483 [11:04<10:17, 3.63s/it] [2024-04-18 17:33:44] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.54.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 65%|█████████████████████████████████████████████████████████████████████████████████████████████▎ | 313/483 [11:05<10:17, 3.63s/it] 65%|█████████████████████████████████████████████████████████████████████████████████████████████▌ | 314/483 [11:05<08:38, 3.07s/it] [2024-04-18 17:33:44] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.54.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 65%|█████████████████████████████████████████████████████████████████████████████████████████████▌ | 314/483 [11:05<08:38, 3.07s/it] [2024-04-18 17:33:44] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.55.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 65%|█████████████████████████████████████████████████████████████████████████████████████████████▌ | 314/483 [11:05<08:38, 3.07s/it] [2024-04-18 17:33:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.55.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 65%|█████████████████████████████████████████████████████████████████████████████████████████████▌ | 314/483 [11:06<08:38, 3.07s/it] [2024-04-18 17:33:47] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.55.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 65%|█████████████████████████████████████████████████████████████████████████████████████████████▌ | 314/483 [11:07<08:38, 3.07s/it] 66%|██████████████████████████████████████████████████████████████████████████████████████████████▌ | 317/483 [11:07<04:59, 1.80s/it] [2024-04-18 17:33:51] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.55.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 66%|██████████████████████████████████████████████████████████████████████████████████████████████▌ | 317/483 [11:11<04:59, 1.80s/it] [2024-04-18 17:33:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.55.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 66%|██████████████████████████████████████████████████████████████████████████████████████████████▌ | 317/483 [11:12<04:59, 1.80s/it] 66%|██████████████████████████████████████████████████████████████████████████████████████████████▊ | 318/483 [11:12<06:59, 2.54s/it] [2024-04-18 17:33:52] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.55.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 66%|██████████████████████████████████████████████████████████████████████████████████████████████▊ | 318/483 [11:12<06:59, 2.54s/it] [2024-04-18 17:33:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.55.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 66%|██████████████████████████████████████████████████████████████████████████████████████████████▊ | 318/483 [11:13<06:59, 2.54s/it] [2024-04-18 17:33:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.55.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 66%|██████████████████████████████████████████████████████████████████████████████████████████████▊ | 318/483 [11:13<06:59, 2.54s/it] 66%|███████████████████████████████████████████████████████████████████████████████████████████████▍ | 320/483 [11:13<04:57, 1.83s/it] [2024-04-18 17:33:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.55.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 66%|███████████████████████████████████████████████████████████████████████████████████████████████▍ | 320/483 [11:14<04:57, 1.83s/it] [2024-04-18 17:33:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.55.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 66%|███████████████████████████████████████████████████████████████████████████████████████████████▍ | 320/483 [11:14<04:57, 1.83s/it] 66%|███████████████████████████████████████████████████████████████████████████████████████████████▋ | 321/483 [11:14<04:12, 1.56s/it] [2024-04-18 17:33:54] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.56.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 66%|███████████████████████████████████████████████████████████████████████████████████████████████▋ | 321/483 [11:14<04:12, 1.56s/it] [2024-04-18 17:33:55] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.56.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 66%|███████████████████████████████████████████████████████████████████████████████████████████████▋ | 321/483 [11:15<04:12, 1.56s/it] [2024-04-18 17:33:56] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.56.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 66%|███████████████████████████████████████████████████████████████████████████████████████████████▋ | 321/483 [11:16<04:12, 1.56s/it] 67%|████████████████████████████████████████████████████████████████████████████████████████████████▎ | 323/483 [11:16<03:28, 1.31s/it] [2024-04-18 17:34:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.56.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 67%|████████████████████████████████████████████████████████████████████████████████████████████████▎ | 323/483 [11:21<03:28, 1.31s/it] [2024-04-18 17:34:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.56.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 67%|████████████████████████████████████████████████████████████████████████████████████████████████▎ | 323/483 [11:22<03:28, 1.31s/it] 67%|████████████████████████████████████████████████████████████████████████████████████████████████▌ | 324/483 [11:22<05:59, 2.26s/it] [2024-04-18 17:34:01] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.56.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 67%|████████████████████████████████████████████████████████████████████████████████████████████████▌ | 324/483 [11:22<05:59, 2.26s/it] [2024-04-18 17:34:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.56.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 67%|████████████████████████████████████████████████████████████████████████████████████████████████▌ | 324/483 [11:23<05:59, 2.26s/it] [2024-04-18 17:34:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.56.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 67%|████████████████████████████████████████████████████████████████████████████████████████████████▌ | 324/483 [11:23<05:59, 2.26s/it] 67%|█████████████████████████████████████████████████████████████████████████████████████████████████▏ | 326/483 [11:23<04:14, 1.62s/it] [2024-04-18 17:34:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.56.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 67%|█████████████████████████████████████████████████████████████████████████████████████████████████▏ | 326/483 [11:23<04:14, 1.62s/it] [2024-04-18 17:34:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.56.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 67%|█████████████████████████████████████████████████████████████████████████████████████████████████▏ | 326/483 [11:23<04:14, 1.62s/it] 68%|█████████████████████████████████████████████████████████████████████████████████████████████████▍ | 327/483 [11:23<03:35, 1.38s/it] [2024-04-18 17:34:03] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00022-of-00030.safetensors + 68%|█████████████████████████████████████████████████████████████████████████████████████████████████▍ | 327/483 [11:23<03:35, 1.38s/it] [2024-04-18 17:34:16] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.57.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 68%|█████████████████████████████████████████████████████████████████████████████████████████████████▍ | 327/483 [11:36<03:35, 1.38s/it] [2024-04-18 17:34:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.57.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 68%|█████████████████████████████████████████████████████████████████████████████████████████████████▍ | 327/483 [11:38<03:35, 1.38s/it] 68%|█████████████████████████████████████████████████████████████████████████████████████████████████▊ | 328/483 [11:38<11:34, 4.48s/it] [2024-04-18 17:34:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.57.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 68%|█████████████████████████████████████████████████████████████████████████████████████████████████▊ | 328/483 [11:39<11:34, 4.48s/it] [2024-04-18 17:34:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.57.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 68%|█████████████████████████████████████████████████████████████████████████████████████████████████▊ | 328/483 [11:39<11:34, 4.48s/it] 68%|██████████████████████████████████████████████████████████████████████████████████████████████████ | 329/483 [11:40<09:38, 3.76s/it] [2024-04-18 17:34:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.57.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 68%|██████████████████████████████████████████████████████████████████████████████████████████████████ | 329/483 [11:40<09:38, 3.76s/it] [2024-04-18 17:34:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.57.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 68%|██████████████████████████████████████████████████████████████████████████████████████████████████ | 329/483 [11:40<09:38, 3.76s/it] 68%|██████████████████████████████████████████████████████████████████████████████████████████████████▍ | 330/483 [11:40<07:23, 2.90s/it] [2024-04-18 17:34:20] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.57.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 68%|██████████████████████████████████████████████████████████████████████████████████████████████████▍ | 330/483 [11:40<07:23, 2.90s/it] [2024-04-18 17:34:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.57.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 68%|██████████████████████████████████████████████████████████████████████████████████████████████████▍ | 330/483 [11:42<07:23, 2.90s/it] [2024-04-18 17:34:22] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.57.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 68%|██████████████████████████████████████████████████████████████████████████████████████████████████▍ | 330/483 [11:42<07:23, 2.90s/it] 69%|██████████████████████████████████████████████████████████████████████████████████████████████████▉ | 332/483 [11:42<05:16, 2.09s/it] [2024-04-18 17:34:22] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.57.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 69%|██████████████████████████████████████████████████████████████████████████████████████████████████▉ | 332/483 [11:42<05:16, 2.09s/it] [2024-04-18 17:34:22] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.58.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 69%|██████████████████████████████████████████████████████████████████████████████████████████████████▉ | 332/483 [11:42<05:16, 2.09s/it] [2024-04-18 17:34:23] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.58.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 69%|██████████████████████████████████████████████████████████████████████████████████████████████████▉ | 332/483 [11:43<05:16, 2.09s/it] [2024-04-18 17:34:24] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.58.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 69%|██████████████████████████████████████████████████████████████████████████████████████████████████▉ | 332/483 [11:44<05:16, 2.09s/it] 69%|███████████████████████████████████████████████████████████████████████████████████████████████████▉ | 335/483 [11:44<03:21, 1.36s/it] [2024-04-18 17:34:28] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.58.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 69%|███████████████████████████████████████████████████████████████████████████████████████████████████▉ | 335/483 [11:48<03:21, 1.36s/it] [2024-04-18 17:34:29] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.58.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 69%|███████████████████████████████████████████████████████████████████████████████████████████████████▉ | 335/483 [11:49<03:21, 1.36s/it] 70%|████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 336/483 [11:49<05:08, 2.10s/it] [2024-04-18 17:34:29] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.58.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 70%|████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 336/483 [11:49<05:08, 2.10s/it] [2024-04-18 17:34:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.58.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 70%|████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 336/483 [11:50<05:08, 2.10s/it] [2024-04-18 17:34:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.58.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 70%|████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 336/483 [11:50<05:08, 2.10s/it] 70%|████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 338/483 [11:50<03:43, 1.54s/it] [2024-04-18 17:34:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.58.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 70%|████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 338/483 [11:50<03:43, 1.54s/it] [2024-04-18 17:34:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.58.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 70%|████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 338/483 [11:50<03:43, 1.54s/it] 70%|█████████████████████████████████████████████████████████████████████████████████████████████████████ | 339/483 [11:50<03:09, 1.32s/it] [2024-04-18 17:34:30] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.59.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 70%|█████████████████████████████████████████████████████████████████████████████████████████████████████ | 339/483 [11:50<03:09, 1.32s/it] [2024-04-18 17:34:32] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.59.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 70%|█████████████████████████████████████████████████████████████████████████████████████████████████████ | 339/483 [11:52<03:09, 1.32s/it] [2024-04-18 17:34:32] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.59.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 70%|█████████████████████████████████████████████████████████████████████████████████████████████████████ | 339/483 [11:52<03:09, 1.32s/it] 71%|█████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 341/483 [11:52<02:45, 1.17s/it] [2024-04-18 17:34:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.59.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 71%|█████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 341/483 [11:57<02:45, 1.17s/it] [2024-04-18 17:34:37] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.59.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 71%|█████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 341/483 [11:57<02:45, 1.17s/it] 71%|█████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 342/483 [11:57<04:38, 1.98s/it] [2024-04-18 17:34:37] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.59.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 71%|█████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 342/483 [11:57<04:38, 1.98s/it] [2024-04-18 17:34:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.59.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 71%|█████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 342/483 [11:58<04:38, 1.98s/it] [2024-04-18 17:34:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.59.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 71%|█████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 342/483 [11:58<04:38, 1.98s/it] 71%|██████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 344/483 [11:58<03:20, 1.44s/it] [2024-04-18 17:34:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.59.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 71%|██████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 344/483 [11:59<03:20, 1.44s/it] [2024-04-18 17:34:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.59.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 71%|██████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 344/483 [11:59<03:20, 1.44s/it] 71%|██████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 345/483 [11:59<02:49, 1.23s/it] [2024-04-18 17:34:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.60.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 71%|██████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 345/483 [12:00<02:49, 1.23s/it] [2024-04-18 17:34:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.60.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 71%|██████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 345/483 [12:00<02:49, 1.23s/it] 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 346/483 [12:00<02:36, 1.14s/it] [2024-04-18 17:34:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.60.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 346/483 [12:00<02:36, 1.14s/it] [2024-04-18 17:34:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.60.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 346/483 [12:00<02:36, 1.14s/it] 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 347/483 [12:00<02:10, 1.04it/s] [2024-04-18 17:34:40] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00022-of-00030.safetensors + 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 347/483 [12:00<02:10, 1.04it/s] [2024-04-18 17:34:40] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00021-of-00030.safetensors + 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 347/483 [12:01<02:10, 1.04it/s] [2024-04-18 17:34:41] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00023-of-00030.safetensors + 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 347/483 [12:01<02:10, 1.04it/s] [2024-04-18 17:34:50] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.60.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 347/483 [12:10<02:10, 1.04it/s] 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 348/483 [12:10<07:41, 3.42s/it] [2024-04-18 17:34:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.60.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 348/483 [12:13<07:41, 3.42s/it] [2024-04-18 17:34:53] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.60.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 72%|███████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 348/483 [12:13<07:41, 3.42s/it] 72%|████████████████████████████████████████████████████████████████████████████████████████████████████████ | 349/483 [12:13<07:09, 3.21s/it] [2024-04-18 17:34:58] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.60.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 72%|████████████████████████████████████████████████████████████████████████████████████████████████████████ | 349/483 [12:18<07:09, 3.21s/it] [2024-04-18 17:34:58] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.60.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 72%|████████████████████████████████████████████████████████████████████████████████████████████████████████ | 349/483 [12:19<07:09, 3.21s/it] 72%|████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 350/483 [12:19<08:34, 3.87s/it] [2024-04-18 17:34:59] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.60.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 72%|████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 350/483 [12:19<08:34, 3.87s/it] [2024-04-18 17:34:59] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.61.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 72%|████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 350/483 [12:19<08:34, 3.87s/it] [2024-04-18 17:35:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.61.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 72%|████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 350/483 [12:20<08:34, 3.87s/it] [2024-04-18 17:35:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.61.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 72%|████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 350/483 [12:20<08:34, 3.87s/it] 73%|█████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 353/483 [12:20<04:26, 2.05s/it] [2024-04-18 17:35:05] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.61.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 73%|█████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 353/483 [12:25<04:26, 2.05s/it] [2024-04-18 17:35:05] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.61.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 73%|█████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 353/483 [12:26<04:26, 2.05s/it] 73%|█████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 354/483 [12:26<05:52, 2.73s/it] [2024-04-18 17:35:05] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.61.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 73%|█████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 354/483 [12:26<05:52, 2.73s/it] [2024-04-18 17:35:06] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.61.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 73%|█████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 354/483 [12:26<05:52, 2.73s/it] [2024-04-18 17:35:06] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.61.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 73%|█████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 354/483 [12:27<05:52, 2.73s/it] 74%|██████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 356/483 [12:27<03:58, 1.88s/it] [2024-04-18 17:35:07] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.61.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 74%|██████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 356/483 [12:27<03:58, 1.88s/it] [2024-04-18 17:35:07] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.61.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 74%|██████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 356/483 [12:27<03:58, 1.88s/it] 74%|██████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 357/483 [12:27<03:15, 1.56s/it] [2024-04-18 17:35:07] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.62.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 74%|██████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 357/483 [12:27<03:15, 1.56s/it] [2024-04-18 17:35:08] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.62.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 74%|██████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 357/483 [12:28<03:15, 1.56s/it] [2024-04-18 17:35:08] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.62.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 74%|██████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 357/483 [12:28<03:15, 1.56s/it] 74%|███████████████████████████████████████████████████████████████████████████████████████████████████████████ | 359/483 [12:28<02:37, 1.27s/it] [2024-04-18 17:35:12] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.62.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 74%|███████████████████████████████████████████████████████████████████████████████████████████████████████████ | 359/483 [12:32<02:37, 1.27s/it] [2024-04-18 17:35:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.62.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 74%|███████████████████████████████████████████████████████████████████████████████████████████████████████████ | 359/483 [12:33<02:37, 1.27s/it] 75%|███████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 360/483 [12:33<03:58, 1.94s/it] [2024-04-18 17:35:13] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.62.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 75%|███████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 360/483 [12:33<03:58, 1.94s/it] [2024-04-18 17:35:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.62.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 75%|███████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 360/483 [12:34<03:58, 1.94s/it] [2024-04-18 17:35:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.62.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 75%|███████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 360/483 [12:34<03:58, 1.94s/it] 75%|███████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 362/483 [12:34<02:44, 1.36s/it] [2024-04-18 17:35:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.62.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 75%|███████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 362/483 [12:34<02:44, 1.36s/it] [2024-04-18 17:35:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.62.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 75%|███████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 362/483 [12:34<02:44, 1.36s/it] 75%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 363/483 [12:34<02:16, 1.14s/it] [2024-04-18 17:35:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.63.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 75%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 363/483 [12:35<02:16, 1.14s/it] [2024-04-18 17:35:15] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.63.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 75%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 363/483 [12:35<02:16, 1.14s/it] 75%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 364/483 [12:35<02:05, 1.05s/it] [2024-04-18 17:35:15] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00023-of-00030.safetensors + 75%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 364/483 [12:35<02:05, 1.05s/it] [2024-04-18 17:35:15] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00024-of-00030.safetensors + 75%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 364/483 [12:35<02:05, 1.05s/it] [2024-04-18 17:35:25] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.63.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 75%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 364/483 [12:45<02:05, 1.05s/it] 76%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 365/483 [12:45<06:28, 3.29s/it] [2024-04-18 17:35:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.63.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 76%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 365/483 [12:46<06:28, 3.29s/it] [2024-04-18 17:35:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.63.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 76%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 365/483 [12:46<06:28, 3.29s/it] 76%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 366/483 [12:46<05:32, 2.84s/it] [2024-04-18 17:35:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.63.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 76%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 366/483 [12:50<05:32, 2.84s/it] [2024-04-18 17:35:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.63.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 76%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 366/483 [12:51<05:32, 2.84s/it] 76%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 367/483 [12:51<06:35, 3.41s/it] [2024-04-18 17:35:31] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.63.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 76%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 367/483 [12:51<06:35, 3.41s/it] [2024-04-18 17:35:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.63.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 76%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 367/483 [12:52<06:35, 3.41s/it] [2024-04-18 17:35:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.63.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 76%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 367/483 [12:52<06:35, 3.41s/it] 76%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 369/483 [12:52<03:48, 2.00s/it] [2024-04-18 17:35:31] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.64.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 76%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 369/483 [12:52<03:48, 2.00s/it] [2024-04-18 17:35:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.64.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 76%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 369/483 [12:53<03:48, 2.00s/it] [2024-04-18 17:35:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.64.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 76%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 369/483 [12:53<03:48, 2.00s/it] 77%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 371/483 [12:53<02:50, 1.53s/it] [2024-04-18 17:35:37] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.64.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 77%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 371/483 [12:57<02:50, 1.53s/it] [2024-04-18 17:35:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.64.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 77%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 371/483 [12:58<02:50, 1.53s/it] 77%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 372/483 [12:58<04:08, 2.24s/it] [2024-04-18 17:35:38] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.64.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 77%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 372/483 [12:58<04:08, 2.24s/it] [2024-04-18 17:35:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.64.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 77%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 372/483 [12:59<04:08, 2.24s/it] [2024-04-18 17:35:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.64.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 77%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 372/483 [12:59<04:08, 2.24s/it] 77%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 374/483 [12:59<02:46, 1.53s/it] [2024-04-18 17:35:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.64.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 77%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 374/483 [12:59<02:46, 1.53s/it] [2024-04-18 17:35:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.64.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 77%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 374/483 [12:59<02:46, 1.53s/it] 78%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 375/483 [12:59<02:18, 1.29s/it] [2024-04-18 17:35:39] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.65.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 78%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 375/483 [12:59<02:18, 1.29s/it] [2024-04-18 17:35:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.65.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 78%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 375/483 [13:00<02:18, 1.29s/it] [2024-04-18 17:35:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.65.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 78%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 375/483 [13:01<02:18, 1.29s/it] 78%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 377/483 [13:01<01:51, 1.05s/it] [2024-04-18 17:35:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.65.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 78%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 377/483 [13:05<01:51, 1.05s/it] [2024-04-18 17:35:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.65.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 78%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 377/483 [13:05<01:51, 1.05s/it] 78%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 378/483 [13:05<03:14, 1.86s/it] [2024-04-18 17:35:45] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.65.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 78%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 378/483 [13:05<03:14, 1.86s/it] [2024-04-18 17:35:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.65.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 78%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 378/483 [13:06<03:14, 1.86s/it] [2024-04-18 17:35:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.65.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 78%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 378/483 [13:06<03:14, 1.86s/it] 79%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 380/483 [13:06<02:13, 1.30s/it] [2024-04-18 17:35:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.65.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 79%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 380/483 [13:06<02:13, 1.30s/it] [2024-04-18 17:35:46] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.65.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 79%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 380/483 [13:06<02:13, 1.30s/it] 79%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 381/483 [13:06<01:51, 1.09s/it] [2024-04-18 17:35:46] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00024-of-00030.safetensors + 79%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 381/483 [13:06<01:51, 1.09s/it] [2024-04-18 17:35:47] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00025-of-00030.safetensors + 79%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 381/483 [13:07<01:51, 1.09s/it] [2024-04-18 17:35:56] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.66.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 79%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 381/483 [13:16<01:51, 1.09s/it] 79%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 382/483 [13:16<05:05, 3.02s/it] [2024-04-18 17:35:57] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.66.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 79%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 382/483 [13:17<05:05, 3.02s/it] [2024-04-18 17:35:57] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.66.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 79%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 382/483 [13:18<05:05, 3.02s/it] 79%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 383/483 [13:18<04:31, 2.71s/it] [2024-04-18 17:36:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.66.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 79%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 383/483 [13:22<04:31, 2.71s/it] [2024-04-18 17:36:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.66.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 79%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 383/483 [13:24<04:31, 2.71s/it] 80%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 384/483 [13:24<05:54, 3.59s/it] [2024-04-18 17:36:03] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.66.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 80%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 384/483 [13:24<05:54, 3.59s/it] [2024-04-18 17:36:04] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.66.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 80%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 384/483 [13:25<05:54, 3.59s/it] [2024-04-18 17:36:04] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.66.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 80%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 384/483 [13:25<05:54, 3.59s/it] 80%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 386/483 [13:25<03:40, 2.28s/it] [2024-04-18 17:36:05] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.66.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 80%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 386/483 [13:25<03:40, 2.28s/it] [2024-04-18 17:36:05] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.66.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 80%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 386/483 [13:25<03:40, 2.28s/it] 80%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 387/483 [13:25<02:56, 1.84s/it] [2024-04-18 17:36:05] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.67.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 80%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 387/483 [13:25<02:56, 1.84s/it] [2024-04-18 17:36:06] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.67.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 80%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 387/483 [13:26<02:56, 1.84s/it] [2024-04-18 17:36:06] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.67.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 80%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 387/483 [13:27<02:56, 1.84s/it] 81%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 389/483 [13:27<02:13, 1.42s/it] [2024-04-18 17:36:11] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.67.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 81%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 389/483 [13:31<02:13, 1.42s/it] [2024-04-18 17:36:12] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.67.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 81%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 389/483 [13:32<02:13, 1.42s/it] 81%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 390/483 [13:32<03:32, 2.29s/it] [2024-04-18 17:36:12] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.67.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 81%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 390/483 [13:32<03:32, 2.29s/it] [2024-04-18 17:36:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.67.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 81%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 390/483 [13:33<03:32, 2.29s/it] [2024-04-18 17:36:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.67.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 81%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 390/483 [13:33<03:32, 2.29s/it] 81%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 392/483 [13:33<02:26, 1.61s/it] [2024-04-18 17:36:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.67.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 81%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 392/483 [13:33<02:26, 1.61s/it] [2024-04-18 17:36:13] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.67.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 81%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 392/483 [13:33<02:26, 1.61s/it] 81%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 393/483 [13:33<02:00, 1.34s/it] [2024-04-18 17:36:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.68.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 81%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 393/483 [13:38<02:00, 1.34s/it] [2024-04-18 17:36:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.68.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 81%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 393/483 [13:39<02:00, 1.34s/it] 82%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 394/483 [13:39<03:21, 2.27s/it] [2024-04-18 17:36:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.68.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 82%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 394/483 [13:40<03:21, 2.27s/it] [2024-04-18 17:36:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.68.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 82%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 394/483 [13:40<03:21, 2.27s/it] 82%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 395/483 [13:40<02:55, 1.99s/it] [2024-04-18 17:36:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.68.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 82%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 395/483 [13:40<02:55, 1.99s/it] [2024-04-18 17:36:20] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.68.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 82%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 395/483 [13:40<02:55, 1.99s/it] 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 396/483 [13:40<02:17, 1.58s/it] [2024-04-18 17:36:20] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00025-of-00030.safetensors + 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 396/483 [13:40<02:17, 1.58s/it] [2024-04-18 17:36:21] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00026-of-00030.safetensors + 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 396/483 [13:41<02:17, 1.58s/it] [2024-04-18 17:36:29] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.68.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 396/483 [13:50<02:17, 1.58s/it] 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 397/483 [13:50<05:18, 3.71s/it] [2024-04-18 17:36:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.68.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 397/483 [13:51<05:18, 3.71s/it] [2024-04-18 17:36:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.68.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 397/483 [13:51<05:18, 3.71s/it] 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 398/483 [13:51<04:26, 3.14s/it] [2024-04-18 17:36:31] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.68.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 398/483 [13:51<04:26, 3.14s/it] [2024-04-18 17:36:31] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.69.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 398/483 [13:51<04:26, 3.14s/it] [2024-04-18 17:36:32] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.69.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 398/483 [13:53<04:26, 3.14s/it] [2024-04-18 17:36:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.69.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 398/483 [13:53<04:26, 3.14s/it] 83%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 401/483 [13:53<02:20, 1.72s/it] [2024-04-18 17:36:37] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.69.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 83%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 401/483 [13:57<02:20, 1.72s/it] [2024-04-18 17:36:38] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.69.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 83%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 401/483 [13:58<02:20, 1.72s/it] 83%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 402/483 [13:58<03:20, 2.47s/it] [2024-04-18 17:36:38] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.69.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 83%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 402/483 [13:58<03:20, 2.47s/it] [2024-04-18 17:36:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.69.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 83%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 402/483 [14:00<03:20, 2.47s/it] [2024-04-18 17:36:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.69.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 83%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 402/483 [14:00<03:20, 2.47s/it] 84%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 404/483 [14:00<02:26, 1.86s/it] [2024-04-18 17:36:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.69.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 84%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 404/483 [14:00<02:26, 1.86s/it] [2024-04-18 17:36:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.69.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 84%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 404/483 [14:00<02:26, 1.86s/it] 84%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 405/483 [14:00<02:00, 1.55s/it] [2024-04-18 17:36:40] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.70.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 84%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 405/483 [14:00<02:00, 1.55s/it] [2024-04-18 17:36:42] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.70.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 84%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 405/483 [14:02<02:00, 1.55s/it] [2024-04-18 17:36:42] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.70.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 84%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 405/483 [14:02<02:00, 1.55s/it] 84%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 407/483 [14:02<01:39, 1.31s/it] [2024-04-18 17:36:47] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.70.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 84%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 407/483 [14:07<01:39, 1.31s/it] [2024-04-18 17:36:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.70.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 84%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 407/483 [14:08<01:39, 1.31s/it] 84%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 408/483 [14:08<02:47, 2.23s/it] [2024-04-18 17:36:48] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.70.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 84%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 408/483 [14:08<02:47, 2.23s/it] [2024-04-18 17:36:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.70.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 84%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 408/483 [14:09<02:47, 2.23s/it] [2024-04-18 17:36:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.70.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 84%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 408/483 [14:09<02:47, 2.23s/it] 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 410/483 [14:09<01:54, 1.57s/it] [2024-04-18 17:36:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.70.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 410/483 [14:09<01:54, 1.57s/it] [2024-04-18 17:36:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.70.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 410/483 [14:09<01:54, 1.57s/it] 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 411/483 [14:09<01:34, 1.31s/it] [2024-04-18 17:36:49] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00027-of-00030.safetensors + 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 411/483 [14:09<01:34, 1.31s/it] [2024-04-18 17:37:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.71.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 411/483 [14:22<01:34, 1.31s/it] [2024-04-18 17:37:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.71.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 411/483 [14:24<01:34, 1.31s/it] 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 412/483 [14:24<05:11, 4.39s/it] [2024-04-18 17:37:04] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.71.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 412/483 [14:24<05:11, 4.39s/it] [2024-04-18 17:37:04] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.71.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 412/483 [14:25<05:11, 4.39s/it] 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 413/483 [14:25<04:06, 3.52s/it] [2024-04-18 17:37:05] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.71.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 413/483 [14:25<04:06, 3.52s/it] [2024-04-18 17:37:05] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.71.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 413/483 [14:25<04:06, 3.52s/it] 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 414/483 [14:25<03:05, 2.69s/it] [2024-04-18 17:37:05] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00026-of-00030.safetensors + 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 414/483 [14:25<03:05, 2.69s/it] [2024-04-18 17:37:05] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00027-of-00030.safetensors + 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 414/483 [14:25<03:05, 2.69s/it] [2024-04-18 17:37:06] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00004-of-00030.safetensors + 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 414/483 [14:26<03:05, 2.69s/it] [2024-04-18 17:37:15] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.7.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 414/483 [14:36<03:05, 2.69s/it] 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 415/483 [14:36<05:28, 4.83s/it] [2024-04-18 17:37:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.7.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 415/483 [14:38<05:28, 4.83s/it] [2024-04-18 17:37:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.7.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 86%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 415/483 [14:38<05:28, 4.83s/it] 86%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 416/483 [14:38<04:44, 4.24s/it] [2024-04-18 17:37:23] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.7.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 86%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 416/483 [14:43<04:44, 4.24s/it] [2024-04-18 17:37:24] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.7.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 86%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 416/483 [14:44<04:44, 4.24s/it] 86%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 417/483 [14:44<05:08, 4.67s/it] [2024-04-18 17:37:24] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.7.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 86%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 417/483 [14:44<05:08, 4.67s/it] [2024-04-18 17:37:24] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.7.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 86%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 417/483 [14:44<05:08, 4.67s/it] [2024-04-18 17:37:24] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.7.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 86%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 417/483 [14:44<05:08, 4.67s/it] 87%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 419/483 [14:44<02:49, 2.65s/it] [2024-04-18 17:37:24] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.8.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 87%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 419/483 [14:44<02:49, 2.65s/it] [2024-04-18 17:37:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.8.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 87%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 419/483 [14:46<02:49, 2.65s/it] [2024-04-18 17:37:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.8.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 87%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 419/483 [14:46<02:49, 2.65s/it] 87%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 421/483 [14:46<02:00, 1.94s/it] [2024-04-18 17:37:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.8.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 87%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 421/483 [14:51<02:00, 1.94s/it] [2024-04-18 17:37:31] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.8.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 87%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 421/483 [14:52<02:00, 1.94s/it] 87%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 422/483 [14:52<02:47, 2.75s/it] [2024-04-18 17:37:31] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.8.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 87%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 422/483 [14:52<02:47, 2.75s/it] [2024-04-18 17:37:32] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.8.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 87%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 422/483 [14:52<02:47, 2.75s/it] [2024-04-18 17:37:32] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.8.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 87%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 422/483 [14:53<02:47, 2.75s/it] 88%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 424/483 [14:53<01:50, 1.87s/it] [2024-04-18 17:37:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.8.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 88%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 424/483 [14:53<01:50, 1.87s/it] [2024-04-18 17:37:33] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.8.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 88%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 424/483 [14:53<01:50, 1.87s/it] 88%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 425/483 [14:53<01:29, 1.55s/it] [2024-04-18 17:37:33] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.9.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 88%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 425/483 [14:53<01:29, 1.55s/it] [2024-04-18 17:37:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.9.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 88%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 425/483 [14:54<01:29, 1.55s/it] [2024-04-18 17:37:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.9.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 88%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 425/483 [14:54<01:29, 1.55s/it] 88%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 427/483 [14:54<01:09, 1.24s/it] [2024-04-18 17:37:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.9.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 88%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 427/483 [14:59<01:09, 1.24s/it] [2024-04-18 17:37:39] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.9.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 88%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 427/483 [14:59<01:09, 1.24s/it] 89%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 428/483 [14:59<01:50, 2.02s/it] [2024-04-18 17:37:39] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.9.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 89%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 428/483 [14:59<01:50, 2.02s/it] [2024-04-18 17:37:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.9.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 89%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 428/483 [15:00<01:50, 2.02s/it] [2024-04-18 17:37:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.9.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 89%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 428/483 [15:00<01:50, 2.02s/it] 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 430/483 [15:00<01:17, 1.45s/it] [2024-04-18 17:37:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.9.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 430/483 [15:01<01:17, 1.45s/it] [2024-04-18 17:37:40] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.9.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 430/483 [15:01<01:17, 1.45s/it] 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 431/483 [15:01<01:03, 1.22s/it] [2024-04-18 17:37:40] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00004-of-00030.safetensors + 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 431/483 [15:01<01:03, 1.22s/it] [2024-04-18 17:37:41] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00027-of-00030.safetensors + 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 431/483 [15:01<01:03, 1.22s/it] [2024-04-18 17:37:42] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.71.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 431/483 [15:02<01:03, 1.22s/it] 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 432/483 [15:02<01:01, 1.20s/it] [2024-04-18 17:37:43] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.71.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 432/483 [15:04<01:01, 1.20s/it] [2024-04-18 17:37:44] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.71.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 432/483 [15:04<01:01, 1.20s/it] 90%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 433/483 [15:04<01:09, 1.39s/it] [2024-04-18 17:37:44] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.71.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 90%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 433/483 [15:04<01:09, 1.39s/it] [2024-04-18 17:37:44] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.72.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 90%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 433/483 [15:04<01:09, 1.39s/it] [2024-04-18 17:37:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.72.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 90%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 433/483 [15:05<01:09, 1.39s/it] [2024-04-18 17:37:45] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.72.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 90%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 433/483 [15:06<01:09, 1.39s/it] 90%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 436/483 [15:06<00:46, 1.01it/s] [2024-04-18 17:37:51] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.72.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 90%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 436/483 [15:11<00:46, 1.01it/s] [2024-04-18 17:37:51] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.72.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 90%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 436/483 [15:12<00:46, 1.01it/s] 90%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 437/483 [15:12<01:30, 1.97s/it] [2024-04-18 17:37:51] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.72.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 90%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 437/483 [15:12<01:30, 1.97s/it] [2024-04-18 17:37:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.72.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 90%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 437/483 [15:12<01:30, 1.97s/it] [2024-04-18 17:37:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.72.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 90%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 437/483 [15:12<01:30, 1.97s/it] 91%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 439/483 [15:12<01:00, 1.38s/it] [2024-04-18 17:37:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.72.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 91%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 439/483 [15:13<01:00, 1.38s/it] [2024-04-18 17:37:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.72.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 91%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 439/483 [15:13<01:00, 1.38s/it] 91%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 440/483 [15:13<00:50, 1.16s/it] [2024-04-18 17:37:52] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.73.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 91%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 440/483 [15:13<00:50, 1.16s/it] [2024-04-18 17:37:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.73.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 91%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 440/483 [15:14<00:50, 1.16s/it] [2024-04-18 17:37:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.73.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 91%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 440/483 [15:14<00:50, 1.16s/it] 92%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 442/483 [15:14<00:43, 1.06s/it] [2024-04-18 17:37:59] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.73.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 92%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 442/483 [15:19<00:43, 1.06s/it] [2024-04-18 17:38:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.73.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 92%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 442/483 [15:20<00:43, 1.06s/it] 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 443/483 [15:20<01:20, 2.02s/it] [2024-04-18 17:38:00] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.73.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 443/483 [15:20<01:20, 2.02s/it] [2024-04-18 17:38:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.73.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 443/483 [15:21<01:20, 2.02s/it] [2024-04-18 17:38:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.73.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 443/483 [15:21<01:20, 2.02s/it] 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 445/483 [15:21<00:54, 1.44s/it] [2024-04-18 17:38:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.73.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 445/483 [15:21<00:54, 1.44s/it] [2024-04-18 17:38:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.73.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 445/483 [15:21<00:54, 1.44s/it] 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 446/483 [15:21<00:44, 1.21s/it] [2024-04-18 17:38:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.74.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 446/483 [15:22<00:44, 1.21s/it] [2024-04-18 17:38:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.74.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 446/483 [15:22<00:44, 1.21s/it] 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 447/483 [15:22<00:40, 1.12s/it] [2024-04-18 17:38:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.74.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 447/483 [15:22<00:40, 1.12s/it] [2024-04-18 17:38:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.74.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 447/483 [15:22<00:40, 1.12s/it] 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 448/483 [15:22<00:32, 1.08it/s] [2024-04-18 17:38:02] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00027-of-00030.safetensors + 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 448/483 [15:22<00:32, 1.08it/s] [2024-04-18 17:38:03] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00028-of-00030.safetensors + 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 448/483 [15:23<00:32, 1.08it/s] [2024-04-18 17:38:12] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.74.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 448/483 [15:32<00:32, 1.08it/s] 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 449/483 [15:32<01:52, 3.31s/it] [2024-04-18 17:38:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.74.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 449/483 [15:34<01:52, 3.31s/it] [2024-04-18 17:38:14] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.74.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 449/483 [15:34<01:52, 3.31s/it] 93%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 450/483 [15:34<01:34, 2.86s/it] [2024-04-18 17:38:18] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.74.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 93%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 450/483 [15:38<01:34, 2.86s/it] [2024-04-18 17:38:19] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.74.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 93%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 450/483 [15:40<01:34, 2.86s/it] 93%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 451/483 [15:40<01:56, 3.64s/it] [2024-04-18 17:38:20] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.74.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 93%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 451/483 [15:40<01:56, 3.64s/it] [2024-04-18 17:38:20] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.75.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 93%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 451/483 [15:40<01:56, 3.64s/it] [2024-04-18 17:38:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.75.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 93%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 451/483 [15:41<01:56, 3.64s/it] [2024-04-18 17:38:21] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.75.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 93%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 451/483 [15:41<01:56, 3.64s/it] 94%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 454/483 [15:42<00:57, 1.97s/it] [2024-04-18 17:38:26] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.75.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 94%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 454/483 [15:46<00:57, 1.97s/it] [2024-04-18 17:38:27] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.75.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 94%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 454/483 [15:47<00:57, 1.97s/it] 94%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 455/483 [15:47<01:14, 2.67s/it] [2024-04-18 17:38:27] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.75.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 94%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 455/483 [15:47<01:14, 2.67s/it] [2024-04-18 17:38:28] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.75.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 94%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 455/483 [15:48<01:14, 2.67s/it] [2024-04-18 17:38:28] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.75.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 94%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 455/483 [15:48<01:14, 2.67s/it] 95%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 457/483 [15:48<00:48, 1.85s/it] [2024-04-18 17:38:28] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.75.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 95%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 457/483 [15:48<00:48, 1.85s/it] [2024-04-18 17:38:28] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.75.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 95%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 457/483 [15:48<00:48, 1.85s/it] 95%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 458/483 [15:48<00:38, 1.56s/it] [2024-04-18 17:38:28] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.76.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 95%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 458/483 [15:48<00:38, 1.56s/it] [2024-04-18 17:38:29] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.76.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 95%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 458/483 [15:49<00:38, 1.56s/it] [2024-04-18 17:38:30] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.76.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 95%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 458/483 [15:50<00:38, 1.56s/it] 95%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 460/483 [15:50<00:29, 1.29s/it] [2024-04-18 17:38:34] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.76.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 95%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 460/483 [15:54<00:29, 1.29s/it] [2024-04-18 17:38:35] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.76.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 95%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 460/483 [15:55<00:29, 1.29s/it] 95%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 461/483 [15:55<00:46, 2.12s/it] [2024-04-18 17:38:35] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.76.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 95%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 461/483 [15:55<00:46, 2.12s/it] [2024-04-18 17:38:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.76.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 95%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 461/483 [15:56<00:46, 2.12s/it] [2024-04-18 17:38:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.76.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 95%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 461/483 [15:56<00:46, 2.12s/it] 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 463/483 [15:56<00:29, 1.50s/it] [2024-04-18 17:38:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.76.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 463/483 [15:56<00:29, 1.50s/it] [2024-04-18 17:38:36] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.76.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 463/483 [15:56<00:29, 1.50s/it] 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 464/483 [15:56<00:24, 1.27s/it] [2024-04-18 17:38:37] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.77.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 464/483 [15:57<00:24, 1.27s/it] [2024-04-18 17:38:37] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.77.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 464/483 [15:57<00:24, 1.27s/it] 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 465/483 [15:57<00:21, 1.17s/it] [2024-04-18 17:38:37] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00028-of-00030.safetensors + 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 465/483 [15:57<00:21, 1.17s/it] [2024-04-18 17:38:38] INFO huggingface_loader.py:184: Loading HF parameters from: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00029-of-00030.safetensors + 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 465/483 [15:58<00:21, 1.17s/it] [2024-04-18 17:38:47] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.77.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 465/483 [16:07<00:21, 1.17s/it] 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 466/483 [16:07<00:56, 3.35s/it] [2024-04-18 17:38:48] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.77.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 466/483 [16:09<00:56, 3.35s/it] [2024-04-18 17:38:49] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.77.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 466/483 [16:09<00:56, 3.35s/it] 97%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 467/483 [16:09<00:46, 2.94s/it] [2024-04-18 17:38:52] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.77.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 97%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 467/483 [16:13<00:46, 2.94s/it] [2024-04-18 17:38:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.77.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 97%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 467/483 [16:14<00:46, 2.94s/it] 97%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 468/483 [16:14<00:51, 3.43s/it] [2024-04-18 17:38:54] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.77.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 97%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 468/483 [16:14<00:51, 3.43s/it] [2024-04-18 17:38:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.77.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 97%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 468/483 [16:14<00:51, 3.43s/it] [2024-04-18 17:38:54] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.77.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 97%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 468/483 [16:14<00:51, 3.43s/it] 97%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 470/483 [16:14<00:26, 2.04s/it] [2024-04-18 17:38:54] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.78.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 97%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 470/483 [16:14<00:26, 2.04s/it] [2024-04-18 17:38:56] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.78.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 97%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 470/483 [16:16<00:26, 2.04s/it] [2024-04-18 17:38:56] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.78.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 97%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 470/483 [16:16<00:26, 2.04s/it] 98%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 472/483 [16:16<00:17, 1.59s/it] [2024-04-18 17:39:00] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.78.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 98%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 472/483 [16:21<00:17, 1.59s/it] [2024-04-18 17:39:01] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.78.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 98%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 472/483 [16:21<00:17, 1.59s/it] 98%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 473/483 [16:21<00:24, 2.40s/it] [2024-04-18 17:39:01] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.78.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 98%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 473/483 [16:21<00:24, 2.40s/it] [2024-04-18 17:39:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.78.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 98%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 473/483 [16:22<00:24, 2.40s/it] [2024-04-18 17:39:02] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.78.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 98%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 473/483 [16:22<00:24, 2.40s/it] 98%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 475/483 [16:22<00:13, 1.68s/it] [2024-04-18 17:39:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.78.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 98%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 475/483 [16:23<00:13, 1.68s/it] [2024-04-18 17:39:03] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.78.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 98%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 475/483 [16:23<00:13, 1.68s/it] 99%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 476/483 [16:23<00:10, 1.43s/it] [2024-04-18 17:39:03] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.79.input_layernorm.weight[0m", shape: (8192,), dtype: float16 + 99%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 476/483 [16:23<00:10, 1.43s/it] [2024-04-18 17:39:04] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.79.mlp.down_proj.q_weight[0m", shape: (8192, 2868), dtype: uint32 + 99%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 476/483 [16:24<00:10, 1.43s/it] [2024-04-18 17:39:04] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.79.mlp.down_proj.q_scale[0m", shape: (8192, 717), dtype: float16 + 99%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 476/483 [16:25<00:10, 1.43s/it] 99%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 478/483 [16:25<00:06, 1.21s/it] [2024-04-18 17:39:08] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.79.mlp.gate_up_proj.q_weight[0m", shape: (57344, 820), dtype: uint32 + 99%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 478/483 [16:28<00:06, 1.21s/it] [2024-04-18 17:39:09] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.79.mlp.gate_up_proj.q_scale[0m", shape: (57344, 205), dtype: float16 + 99%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 478/483 [16:29<00:06, 1.21s/it] 99%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 479/483 [16:29<00:07, 1.93s/it] [2024-04-18 17:39:09] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.layers.79.post_attention_layernorm.weight[0m", shape: (8192,), dtype: float16 + 99%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 479/483 [16:29<00:07, 1.93s/it] [2024-04-18 17:39:10] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.79.self_attn.qkv_proj.q_weight[0m", shape: (10240, 820), dtype: uint32 + 99%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 479/483 [16:31<00:07, 1.93s/it] [2024-04-18 17:39:11] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.79.self_attn.qkv_proj.q_scale[0m", shape: (10240, 205), dtype: float16 + 99%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 479/483 [16:31<00:07, 1.93s/it] 100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍| 481/483 [16:31<00:02, 1.49s/it] [2024-04-18 17:39:11] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.79.self_attn.o_proj.q_weight[0m", shape: (8192, 820), dtype: uint32 + 100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍| 481/483 [16:31<00:02, 1.49s/it] [2024-04-18 17:39:11] INFO huggingface_loader.py:166: [Quantized] Parameter: "[1mmodel.layers.79.self_attn.o_proj.q_scale[0m", shape: (8192, 205), dtype: float16 + 100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍| 481/483 [16:31<00:02, 1.49s/it] 100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋| 482/483 [16:31<00:01, 1.29s/it] [2024-04-18 17:39:11] INFO huggingface_loader.py:174: [Not quantized] Parameter: "[1mmodel.norm.weight[0m", shape: (8192,), dtype: float16 + 100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋| 482/483 [16:31<00:01, 1.29s/it] 100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 483/483 [16:31<00:00, 2.05s/it] +[2024-04-18 17:39:11] INFO huggingface_loader.py:196: Unloading HF weight file: /ssd1/cfruan/models/Meta-Llama-3-70B-Instruct/model-00029-of-00030.safetensors +[2024-04-18 17:39:12] INFO stats.py:76: [92mTime usage[0m: HF loading: 293.607 sec; Pre-quantization mapping: 562.017 sec; Quantization: 3.370 sec +[2024-04-18 17:39:12] INFO stats.py:90: [92mRAM usage[0m: Peak RAM: 17.375 GB. Total bytes loaded from disk: 271.521 GB +[2024-04-18 17:39:12] INFO convert_weight.py:156: [92mParameter size[0m after quantization: 29.594 GB +[2024-04-18 17:39:12] INFO convert_weight.py:161: [92mTotal parameters[0m: 72,885,788,672 +[2024-04-18 17:39:12] INFO convert_weight.py:162: [92mBits per parameter[0m: 3.488 +[2024-04-18 17:39:12] INFO convert_weight.py:167: Saved to directory: [1m/tmp/tmpbtropg_f[0m + +All finished, 456 total shards committed, record saved to /tmp/tmpbtropg_f/ndarray-cache.json diff --git a/mlc-chat-config.json b/mlc-chat-config.json new file mode 100644 index 0000000000000000000000000000000000000000..2f6c0f2d517dc086baf58b3ebe1563550c9599d1 --- /dev/null +++ b/mlc-chat-config.json @@ -0,0 +1,75 @@ +{ + "model_type": "llama", + "quantization": "q3f16_1", + "model_config": { + "hidden_size": 8192, + "intermediate_size": 28672, + "num_attention_heads": 64, + "num_hidden_layers": 80, + "rms_norm_eps": 1e-05, + "vocab_size": 128256, + "position_embedding_base": 500000.0, + "context_window_size": 8192, + "prefill_chunk_size": 1024, + "num_key_value_heads": 8, + "head_dim": 128, + "tensor_parallel_shards": 1, + "max_batch_size": 80 + }, + "vocab_size": 128256, + "context_window_size": 8192, + "sliding_window_size": -1, + "prefill_chunk_size": 1024, + "attention_sink_size": -1, + "tensor_parallel_shards": 1, + "mean_gen_len": 128, + "max_gen_len": 512, + "shift_fill_factor": 0.3, + "temperature": 0.7, + "presence_penalty": 0.0, + "frequency_penalty": 0.0, + "repetition_penalty": 1.0, + "top_p": 0.95, + "conv_template": { + "name": "llama-3", + "system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}", + "system_message": "You are a helpful, respectful and honest assistant.", + "system_prefix_token_ids": [ + 128000 + ], + "add_role_after_system_message": true, + "roles": { + "user": "user", + "assistant": "assistant" + }, + "role_templates": { + "user": "{user_message}", + "assistant": "{assistant_message}", + "tool": "{tool_message}" + }, + "messages": [], + "seps": [ + "<|eot_id|><|start_header_id|>" + ], + "role_content_sep": "<|end_header_id|>\n\n", + "role_empty_sep": "<|end_header_id|>\n\n", + "stop_str": [ + "<|end_of_text|>", + "<|eot_id|>" + ], + "stop_token_ids": [ + 128001, + 128009 + ], + "function_string": "", + "use_function_calling": false + }, + "pad_token_id": 0, + "bos_token_id": 128000, + "eos_token_id": 128001, + "tokenizer_files": [ + "tokenizer.json", + "tokenizer_config.json" + ], + "version": "0.1.0" +} \ No newline at end of file diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..d2e93caf53006d134232cf6bca74a03e62200327 --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,12351 @@ +{ + "metadata": { + "ParamSize": 805, + "ParamBytes": 31776318464.0, + "BitsPerParam": 3.4877930573818188 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 420679680, + "records": [ + { + "name": "lm_head.q_weight", + "shape": [ + 128256, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 420679680, + "byteOffset": 0 + } + ], + "md5sum": "167d7a9b7af56de22920e15c021733ba" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 52584960, + "records": [ + { + "name": "lm_head.q_scale", + "shape": [ + 128256, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 52584960, + "byteOffset": 0 + } + ], + "md5sum": "e9321f4b3a03806c179878cf4fbe4670" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 420679680, + "records": [ + { + "name": "model.embed_tokens.q_weight", + "shape": [ + 128256, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 420679680, + "byteOffset": 0 + } + ], + "md5sum": "367cce4449b115480651d96ea625817a" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 52584960, + "records": [ + { + "name": "model.embed_tokens.q_scale", + "shape": [ + 128256, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 52584960, + "byteOffset": 0 + } + ], + "md5sum": "b5f743dc05d728ff752d216de7147ee9" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.0.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "707c508ebb5434986c6c8a0a44e76e91" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.0.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "7b368b65d23096d193884ec7f5ca1ab2" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.0.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "280cea43c77fe8b0deb0fd4f67921297" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.0.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "0677e17311f61af3c62f2569e652dc17" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.0.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "8ecb7a37751d66f80e6ba1e70e6a41d5" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.1.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "7c4ec25848dfd3807ef6865b65259b45" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.1.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "568acd6985613f8de692ee1e773594e8" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.1.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "e4bffe8109760b617258054b97490aba" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.1.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "31903b7987bb48d71e59c60d1cf90bc6" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.1.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "522e2afd8bf8ef5a3d2811aefdcf23da" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 26910720, + "records": [ + { + "name": "model.layers.0.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 0 + }, + { + "name": "model.layers.0.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 16384 + }, + { + "name": "model.layers.0.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.0.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11780096 + }, + { + "name": "model.layers.0.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15978496 + }, + { + "name": "model.layers.1.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19337216 + }, + { + "name": "model.layers.1.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23535616 + }, + { + "name": "model.layers.1.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26894336 + } + ], + "md5sum": "77e61a21ca520d6ee0f66d9c368b9f8d" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.2.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "e20695557f6e532523dc4b0d7c9f1c00" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.2.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "6b898bd5e1276ca4b13c03a34f60c1a4" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.2.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "940576863d0726dd7008343c2dc6616c" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.2.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "05a7e439b9c0b0435f030500137032a8" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.2.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "91a767efcb34b6ad3cacbf309d152dc8" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.3.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "2d9141d6284907247082c06581eb16ef" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.1.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.1.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.2.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.2.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.2.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.2.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.2.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.3.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "b87f11ce1a186450dc336402c7fb3eab" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.3.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "ca63e01a0654271cd90876fbec515e9c" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.3.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "02d1d4b4751a06ad189fa65a5ffea28e" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.3.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "d371b6ea796fd805554f637be178190f" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.3.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "4e2109c82094851dbf882f57a49f4024" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.4.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "4e11293a996124f8e80dcc0417ad2e66" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.4.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "18258e03ebcc901f393c65fcffdbb9f8" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.10.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "e5deb6dbfc92b796675896a08979f7bd" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.3.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.3.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.3.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.3.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.4.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.4.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.10.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "affcb808ef2058f0071291040f0cd3c3" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.10.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "efe12f17d9ac90e2534aa5c0a6ccbfae" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.10.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "ed457f46507dbfdbee7106a61abc5137" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.10.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "96688c04acb67786c57147e1e6834d51" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.10.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "a0ffbb0799b735d18bf2472dc26fe9b9" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.11.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "43de48ceeb4babe5723571cc4a5c4c66" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.11.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "995d2408c0209d9a52a61b225eea574c" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.11.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "66879fe16480bc4c4c64b77592b9c688" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.11.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "35d2389b936717ba53516e37effad55b" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.10.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.10.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.10.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.10.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.11.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.11.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19337216 + }, + { + "name": "model.layers.11.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31084544 + } + ], + "md5sum": "e4dfb26316a3bb5a59335464c0a04111" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.11.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.11.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "a5d71153c967ee06579574cf5dd44842" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.12.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "5c0da72336cd70220a0a75e98b1cb9ea" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.12.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "4ef636f58eb922d3a2b8bacde5413efe" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.12.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "fe7da0b50ed3d6480007f43b62a5ff0c" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.11.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.12.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 3358720 + }, + { + "name": "model.layers.12.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26869760 + } + ], + "md5sum": "f73ac212d075f130ec18ee8f7f6f5ebd" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.12.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "81a356e86a6a0500d8983f1b6d65f2b3" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.13.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "4dc8140b751eab0141c9b9a1eb0c2dcd" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.13.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "b0263a969bea1bc223fa0a8cd0c5752b" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.13.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "73895dcc7f83f55dfbf944c67f397fc8" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.13.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "3102f39afa4d38ad746a57094d746d2d" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.13.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "5499ae48149287bfd2e307f6f9d13f1e" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.12.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.12.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.12.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.12.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.13.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15138816 + }, + { + "name": "model.layers.13.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15155200 + }, + { + "name": "model.layers.13.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26902528 + }, + { + "name": "model.layers.13.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26918912 + } + ], + "md5sum": "a9f99e8b5140fcbdea5e3d1d396c71ff" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.14.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "a41cb72b3ae03a468ed5e26d20149dfd" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.14.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "b66737e415becb62de23d09f05ca5d22" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.14.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "0235eadd5eb98d31cc08d4bd694588db" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.14.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "0a959c43094a621da9a130b6a32e563a" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.14.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "a843b3f16a6ebba9127514d9745147c6" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.15.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "5c7ecc05f17bab1d8966f7f3c9ef229a" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.15.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "f8e2b636e96a6b26d8d45071b9069d28" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.15.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "3cadbc6d4fd3789cc561ef2938f1d6b6" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.15.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "26eab59c2db4a98b5f5b6044b44ec654" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.15.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "84bbb9d24428ef901ab7cb1930b7c035" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.13.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.14.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.14.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.14.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.14.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.14.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.15.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.15.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.15.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "4aee7bd8ff570ea0541eeb1adbbef77e" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.16.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "66397c19898ce97beb7ebeac832b0bf4" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.16.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "dc2227ed7d67a38dbacab3eb321cdef5" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.16.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "3a697897630e2fbbc0777ab1ab6d9b27" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.16.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "02e7cf9bc747f3b5796272699254472a" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.16.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "a0bbf2cd12ba213b9cdcfdbd6692e8e4" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.17.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "b795eafa8cd3e4f1591ed00d1ad12fff" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.15.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.15.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.16.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.16.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.16.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.16.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.16.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.17.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "0209c12c993ff7ce26959a5fda60045e" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.17.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "4ce443f86a2d174c40037ad35b3719bb" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.17.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "27ffcb6d7284cc59fca2270b458a4366" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.17.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "d9b483e3acabc106c367bd090c4e7311" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.17.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "9c4c2d0b0c7fff81c28b039d1c13ebd4" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.18.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "03984c9bb9126412b963b4d3324a05a9" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.18.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "67acaa5e5c60ff8b800e4ca790534e36" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.18.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "43e3e93e9506d8764726ee213efd95aa" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.17.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.17.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.17.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.17.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.18.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.18.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.18.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "5a1713176edd3e570b10d602c7461c2a" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.18.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "67f95cc6e53536136d2bd8950191bb3b" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.18.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "fec92d61ed3ffa910e9587c4e0727c27" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.19.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "828a358bc79572087931bbf848660866" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.19.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "d602f3d45aa9a33925334326eb3d30cb" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.19.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "25dc8844f8e94db830fba945040ed85b" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.19.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "224383d6644728788ed4e106962a5355" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.19.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "fac45b07dc008a7a4e9c075c2be6c5f5" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.20.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "31c9c4a444c2e89fca28dbdef5ca58dc" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.18.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.18.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.19.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.19.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.19.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.19.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.19.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.20.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "5f9135006906dac1d55da4229e6960b0" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.20.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "a7e7966698f4820db430480be384f44b" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.20.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "3e73f71723f9a48e58ed7fcda5c8bde7" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.20.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "f911c10c1b33be286e514f98879b07a6" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.20.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "2c74d59beb4631db32d0ee857ad58541" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.21.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "dae763dcc9153bae1726800d88f98409" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.21.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "c8d6e4dcb4e6903e5739cb097bc1e1a4" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 23535616, + "records": [ + { + "name": "model.layers.20.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.20.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.20.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.20.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.21.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.21.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23519232 + } + ], + "md5sum": "0ad51ee9350ba7923f5062aadfef27f0" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.21.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "b0dc80264b70cf5030a9efbf0786ec26" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.21.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "a4925c7bb26ea0ef2d5a93305dea00f7" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.21.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "53412b54a5958d3d48a53da327a4d17f" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.22.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "f4030f1054f78311e949edb143c50bab" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.22.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "cb27a1854b25d0c0a98cdf45efa3ecd1" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.22.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "4041f732d883d61a6e28dafc82b5de90" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.22.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "fa839e8042ef7952a13693c7ff0ed922" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.22.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "e620506ff977bce0b2686c5a4f3ef907" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.21.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.21.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.21.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 11763712 + }, + { + "name": "model.layers.22.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.22.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15138816 + }, + { + "name": "model.layers.22.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26886144 + }, + { + "name": "model.layers.22.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26902528 + } + ], + "md5sum": "94d576eadd73a3068c7911112e00762b" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.23.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "1bf1c966ad4245d50391fc7bbd58d11c" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.23.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "a218c109571370f42fc34a005eea0123" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.23.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "93d15bd907da7ce514e7f9d9f292976b" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.23.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "cdc473999ff40da17ad59affd3f90eb6" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.23.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "99d2be7c8689e8818ba8f0e06d196d31" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.24.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "165ed44149d22c9f2465e227b00506b7" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 22712320, + "records": [ + { + "name": "model.layers.22.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.23.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.23.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.23.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.23.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.23.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.24.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22695936 + } + ], + "md5sum": "38d1c7bb4839a65640b06efdd338d3e1" + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.24.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "67a26d5603aba74e02b629a225e66e13" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.24.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "af197d7456a59b3f193e7cfd224a3edc" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.24.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "bdbc63c67d5087d07b826e262f1ed0de" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.24.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "40c9bca3a2d1d886783cb09b9d74b13f" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.25.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "1a05e0dfb4ebaacc3a1677539934c703" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.25.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "ff50c9d625a719b8e60507330a849cf3" + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.25.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "f2b8a299c2c52aafbcb33261796e857c" + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.25.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "9d5531fb05aa08bc0d786e34df07a939" + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.24.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.24.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.24.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.24.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.25.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.25.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19337216 + }, + { + "name": "model.layers.25.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31084544 + } + ], + "md5sum": "7f75e212ad547054aa5e7bcdf7d10552" + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.25.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.25.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "56c9244bd895b6e3d830dd9037bcfdf2" + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.26.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "5b6dc6c4f3a737ac398904aeefd4dd10" + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.26.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "cad2178cb29af0ff72352f98119afc20" + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.26.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "53376588da37e9efc6fc26bea813ee4e" + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.25.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.26.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 3358720 + }, + { + "name": "model.layers.26.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26869760 + } + ], + "md5sum": "1c02d9078d5f6d059ed33be2d922efe8" + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.26.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "f620ca727ae35d14c845ec0d6217d0eb" + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.27.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "8c7f98929c73dab36d7012450fc7d1e9" + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.27.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "1a976836c14cb9dc9a08aee3c604c772" + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.27.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "514e89cb379a4e8f8007d8f2fb182e83" + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.27.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "3b8da83d076efb77f97b05d084a26cd4" + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.27.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "d6f4193121dac71431754de3e6c2f412" + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.26.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.26.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.26.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.26.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.27.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15138816 + }, + { + "name": "model.layers.27.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15155200 + }, + { + "name": "model.layers.27.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26902528 + }, + { + "name": "model.layers.27.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26918912 + } + ], + "md5sum": "e462f3f98f6ce3d72bc45801fe80970b" + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.28.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "d735049c9de316842434d96468e22e8e" + }, + { + "dataPath": "params_shard_131.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.28.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "1abeca7f5bb3d202eaf29ae26f7092b2" + }, + { + "dataPath": "params_shard_132.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.28.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "7b7356ce0d6f53f1ce5080d4f4eb98fa" + }, + { + "dataPath": "params_shard_133.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.28.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "e1b3e9e9ed9ccb8cb4804c9cf30ad33f" + }, + { + "dataPath": "params_shard_134.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.28.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "65c77d460c48c8f5b0111ed40b0382af" + }, + { + "dataPath": "params_shard_135.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.29.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "01f10445dcf40cc96a545f693a9699ce" + }, + { + "dataPath": "params_shard_136.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.29.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "9713ad533de0b17b0811172704ad397e" + }, + { + "dataPath": "params_shard_137.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.29.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "f7de36044b9b7ce36cf52c0b87a27a73" + }, + { + "dataPath": "params_shard_138.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.29.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "b6d123403fd3032765c4358924bda2e3" + }, + { + "dataPath": "params_shard_139.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.29.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "04d6b87e75ae96edba8ab9c74b1d6bd2" + }, + { + "dataPath": "params_shard_140.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.27.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.28.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.28.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.28.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.28.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.28.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.29.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.29.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.29.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "e9b68fac678bc0e6e3e1bca423f5b813" + }, + { + "dataPath": "params_shard_141.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.30.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "2c3652d32baa0fa70cc30ba8a717a4e5" + }, + { + "dataPath": "params_shard_142.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.30.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "6260942e5c3a4c58b8177fa5f543737f" + }, + { + "dataPath": "params_shard_143.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.30.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "df4593a8b4d66847415685aeea5df196" + }, + { + "dataPath": "params_shard_144.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.30.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "c4b26c9028348cc952a8db39ba577a1b" + }, + { + "dataPath": "params_shard_145.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.30.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "9b00540dc5dfa455428b4fd7f9887281" + }, + { + "dataPath": "params_shard_146.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.31.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "6baf43f6660dcbdfd927b74a778b1f8a" + }, + { + "dataPath": "params_shard_147.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.29.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.29.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.30.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.30.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.30.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.30.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.30.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.31.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "c3771b630d9e120361754c667e73f926" + }, + { + "dataPath": "params_shard_148.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.31.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "d5e49b611d8dd90032c14d8bad444e3f" + }, + { + "dataPath": "params_shard_149.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.31.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "072f600c83dd87691ba15637a16987f3" + }, + { + "dataPath": "params_shard_150.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.31.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "7e4072ea6b4374770b43a25915a827ef" + }, + { + "dataPath": "params_shard_151.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.31.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "dd8da534be61052866b3be533ad3fa09" + }, + { + "dataPath": "params_shard_152.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.32.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "1096bcff6ddf13fb022ae57893e323d1" + }, + { + "dataPath": "params_shard_153.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.32.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "a95182c11ad6d959d80cc69df890d882" + }, + { + "dataPath": "params_shard_154.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.32.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "750fe17d270159db413eba2594574271" + }, + { + "dataPath": "params_shard_155.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.31.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.31.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.31.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.31.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.32.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.32.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.32.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "8ebcdb07ab0864953d97ed7d26bbd92b" + }, + { + "dataPath": "params_shard_156.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.32.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "c260e1e10f0bf7a1a6440c462509a397" + }, + { + "dataPath": "params_shard_157.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.32.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "3072dec48821158f5a44a161c83263e5" + }, + { + "dataPath": "params_shard_158.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.33.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "6bfef55f35a71166c6a4c06ecb3fee36" + }, + { + "dataPath": "params_shard_159.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.33.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "87ba1ad4c1bdbcdafc3695f8eb35dcbb" + }, + { + "dataPath": "params_shard_160.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.33.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "e75590b3c9263625d309aba7a8efdd80" + }, + { + "dataPath": "params_shard_161.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.33.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "31fa84128ffd0d173b5bd0d73c12b96c" + }, + { + "dataPath": "params_shard_162.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.33.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "75490b43eaa6abd9b8b4563f01f96fc3" + }, + { + "dataPath": "params_shard_163.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.34.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "d3958978275ee7e67fb9a0da561a81f8" + }, + { + "dataPath": "params_shard_164.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.32.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.32.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.33.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.33.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.33.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.33.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.33.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.34.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "a1916ee08636c2da4a18dc62421a05b8" + }, + { + "dataPath": "params_shard_165.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.34.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "36d6d7deca545c1430c7bd736cb9d580" + }, + { + "dataPath": "params_shard_166.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.34.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "6ace2c74cce6df5c2abed402949ddfb3" + }, + { + "dataPath": "params_shard_167.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.34.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "7fad98ef1fa0e939a64977d4c57a3488" + }, + { + "dataPath": "params_shard_168.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.34.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "5143e69fa4c1c532f6f218fe19aeb215" + }, + { + "dataPath": "params_shard_169.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.35.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "a73f8937d3ddf9cdfed6f49f5f6ea6d7" + }, + { + "dataPath": "params_shard_170.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.35.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "24efcd17a1378c1344877d8dac0eb9dd" + }, + { + "dataPath": "params_shard_171.bin", + "format": "raw-shard", + "nbytes": 23535616, + "records": [ + { + "name": "model.layers.34.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.34.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.34.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.34.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.35.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.35.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23519232 + } + ], + "md5sum": "1d41359467232e8e24b666e8d665da30" + }, + { + "dataPath": "params_shard_172.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.35.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "090a9ecf851c094b20fa9236a41632d6" + }, + { + "dataPath": "params_shard_173.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.35.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "04ce4ebc8e6120ccaf0e7552854d8974" + }, + { + "dataPath": "params_shard_174.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.35.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "d19d0977af3c4a681673eb633c0047d9" + }, + { + "dataPath": "params_shard_175.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.36.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "74424afa70c29cafc8e7a865fdc2c4d9" + }, + { + "dataPath": "params_shard_176.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.36.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "c7d8bc397612de310b4ed88760da9a4b" + }, + { + "dataPath": "params_shard_177.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.36.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "9b51bb61a3f18f369dac7627f2306f7d" + }, + { + "dataPath": "params_shard_178.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.36.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "d29a563b2e04092418c93ef3d389d897" + }, + { + "dataPath": "params_shard_179.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.36.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "2a4db3e8e339e12a08f168e9ab7410e5" + }, + { + "dataPath": "params_shard_180.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.35.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.35.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.35.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 11763712 + }, + { + "name": "model.layers.36.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.36.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15138816 + }, + { + "name": "model.layers.36.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26886144 + }, + { + "name": "model.layers.36.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26902528 + } + ], + "md5sum": "dceb99b04557c2f93441665fa412aa88" + }, + { + "dataPath": "params_shard_181.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.37.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "9f2c6f58dc07725b8183ee5d3ef85a56" + }, + { + "dataPath": "params_shard_182.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.37.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "931786a7bb9742b184577d88b8e25061" + }, + { + "dataPath": "params_shard_183.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.37.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "6b667ec0cb046ef92005427bf0e87df8" + }, + { + "dataPath": "params_shard_184.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.37.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "fe0d95f97c12ae0a6aecb016103d63a2" + }, + { + "dataPath": "params_shard_185.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.37.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "26bf2cc42f00a33189aaca19ba69dc9f" + }, + { + "dataPath": "params_shard_186.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.38.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "133be4513fbf1b4b0e4c06fd8edc9143" + }, + { + "dataPath": "params_shard_187.bin", + "format": "raw-shard", + "nbytes": 22712320, + "records": [ + { + "name": "model.layers.36.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.37.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.37.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.37.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.37.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.37.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.38.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22695936 + } + ], + "md5sum": "1efda9072cace9cf085daa35f891ef17" + }, + { + "dataPath": "params_shard_188.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.38.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "7e55426bfaa94c62746a4097983e6c61" + }, + { + "dataPath": "params_shard_189.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.38.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "bb56929a06e19c2d131b86ea1491f4a3" + }, + { + "dataPath": "params_shard_190.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.38.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "413309456c3674fec2d2e928a7339d83" + }, + { + "dataPath": "params_shard_191.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.38.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "41fa6b836b228c6857cf3651ae09fbe3" + }, + { + "dataPath": "params_shard_192.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.39.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "8e8a353b3279af34f5582e07d0ffa152" + }, + { + "dataPath": "params_shard_193.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.39.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "9651dd7ade4fc4be04bb5ee4ebdd3394" + }, + { + "dataPath": "params_shard_194.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.39.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "a1a0bc200f3e046744bc215e2096c824" + }, + { + "dataPath": "params_shard_195.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.39.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "f67dc4f9b7b69e6c0d7d49e05b93c667" + }, + { + "dataPath": "params_shard_196.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.38.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.38.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.38.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.38.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.39.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.39.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19337216 + }, + { + "name": "model.layers.39.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31084544 + } + ], + "md5sum": "e0293237ac7d5adf194b10e818ffe014" + }, + { + "dataPath": "params_shard_197.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.39.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.39.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "246184c722b52a63b8bc059c10ecccbf" + }, + { + "dataPath": "params_shard_198.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.40.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "13dffac87029c6775ebac18a195c325c" + }, + { + "dataPath": "params_shard_199.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.40.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "eeb9e3e631c6a0df8ae7b53e07451ca5" + }, + { + "dataPath": "params_shard_200.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.40.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "307783c4dbf9dff08003e17dd8ab160e" + }, + { + "dataPath": "params_shard_201.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.39.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.40.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 3358720 + }, + { + "name": "model.layers.40.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26869760 + } + ], + "md5sum": "23386020ae0ca30a1cdf25202c8a3bdc" + }, + { + "dataPath": "params_shard_202.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.4.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "3fbd97f50a2e80a222aa07675f64b842" + }, + { + "dataPath": "params_shard_203.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.4.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "62d18bf057596ff25e835f14f3eb9875" + }, + { + "dataPath": "params_shard_204.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.4.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "0b8965e44e28ffc1321797dc1210b076" + }, + { + "dataPath": "params_shard_205.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.5.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "c099b73da0b82588d5dcb21b5cc278bd" + }, + { + "dataPath": "params_shard_206.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.5.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "3287d25fa4eaf9eb3a6c2afe3ba54a4c" + }, + { + "dataPath": "params_shard_207.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.5.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "0c52f14416bbcd9c385bf208beb40536" + }, + { + "dataPath": "params_shard_208.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.5.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "96ba279f2b5eeb0c5e27cf685fd0554e" + }, + { + "dataPath": "params_shard_209.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.5.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "30395ca474e35a0230f629b0a5de8f50" + }, + { + "dataPath": "params_shard_210.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.40.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.4.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.4.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.4.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.5.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15138816 + }, + { + "name": "model.layers.5.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15155200 + }, + { + "name": "model.layers.5.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26902528 + }, + { + "name": "model.layers.5.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26918912 + } + ], + "md5sum": "21be87652d14b58f9ca256356e045266" + }, + { + "dataPath": "params_shard_211.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.6.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "ffc4803d18a7c02c12b48c2a68747179" + }, + { + "dataPath": "params_shard_212.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.6.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "b5d744a2e9e24e65c1bc4a017be7d5ab" + }, + { + "dataPath": "params_shard_213.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.6.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "364e23efba4a4359e63ef4df58088409" + }, + { + "dataPath": "params_shard_214.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.6.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "112a49e419e7cb3b474b40e4ceffc9fb" + }, + { + "dataPath": "params_shard_215.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.6.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "967cf985d65f70ee168752fb7c5ed10e" + }, + { + "dataPath": "params_shard_216.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.7.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "a886f3cca2aee32b2466227328e52884" + }, + { + "dataPath": "params_shard_217.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.40.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "4bb488d86e161f7362a535a99231ba28" + }, + { + "dataPath": "params_shard_218.bin", + "format": "raw-shard", + "nbytes": 26910720, + "records": [ + { + "name": "model.layers.5.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.6.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.6.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.6.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.6.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.6.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.7.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.40.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26894336 + } + ], + "md5sum": "3d4431ef0e2812ee9f85a6d3fd4f72f6" + }, + { + "dataPath": "params_shard_219.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.41.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "82b04b74cd94a10fbfe3e805075b296b" + }, + { + "dataPath": "params_shard_220.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.41.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "c8bb50e3debfa041bd35769d6e6386fc" + }, + { + "dataPath": "params_shard_221.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.41.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "205cc818e9f2cfa27a5a059c163c7f12" + }, + { + "dataPath": "params_shard_222.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.41.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "fcb4886d2faed3ae53bff82634287a1b" + }, + { + "dataPath": "params_shard_223.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.41.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "9f90e39a55c142c1a26834addea8e585" + }, + { + "dataPath": "params_shard_224.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.42.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "0a2b2d3e7e00ee7cf6017c46a20be908" + }, + { + "dataPath": "params_shard_225.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.40.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.40.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.41.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.41.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.41.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.41.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.41.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.42.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "e44b8cf5d2d86d1e38b674cb1422b358" + }, + { + "dataPath": "params_shard_226.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.42.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "d70fa0fc51c370f3b66e1e90ae88b72c" + }, + { + "dataPath": "params_shard_227.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.42.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "2e390caec19bda3c41a0588dab2f3b1a" + }, + { + "dataPath": "params_shard_228.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.42.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "34dbb3366ee6f4f9a4e616412323a0b9" + }, + { + "dataPath": "params_shard_229.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.42.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "a232895b056065df89708f660ca7eb6c" + }, + { + "dataPath": "params_shard_230.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.43.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "d1853c33dc2de244586dfe8fec5057cd" + }, + { + "dataPath": "params_shard_231.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.43.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "9d80a8dfc234a3ee8b39061f199a56b2" + }, + { + "dataPath": "params_shard_232.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.43.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "378e19ba4390382462c8508717d721bb" + }, + { + "dataPath": "params_shard_233.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.43.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "41c1da2fb3b08594e8f38de8c386a856" + }, + { + "dataPath": "params_shard_234.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.43.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "fdd7f0d1e78f8e247585a35f1953308a" + }, + { + "dataPath": "params_shard_235.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.42.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.42.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.42.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.42.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.43.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.43.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.43.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "dd7e5f56013d7017fd54aef283c1964b" + }, + { + "dataPath": "params_shard_236.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.44.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "a90efa1dc93c042d1c524061f2b11b2e" + }, + { + "dataPath": "params_shard_237.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.44.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "e7b15a8fd669f2b0f0604bc92829646a" + }, + { + "dataPath": "params_shard_238.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.44.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "111021fc197b6361004a3536e06bcf76" + }, + { + "dataPath": "params_shard_239.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.44.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "a20bd82a696f4f908368c1167b7f0ab0" + }, + { + "dataPath": "params_shard_240.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.44.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "5bc6ffdb43b8d88dc7ed2ab0f369dedf" + }, + { + "dataPath": "params_shard_241.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.45.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "a44ab7b38bb5593b216c6ca663271e1d" + }, + { + "dataPath": "params_shard_242.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.43.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.43.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.44.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.44.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.44.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.44.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.44.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.45.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "f99e4e524c97995a793f704c722a50e1" + }, + { + "dataPath": "params_shard_243.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.45.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "337b85e0eda6bd79d6d80871aefb0156" + }, + { + "dataPath": "params_shard_244.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.45.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "e1032e51eaeb6374db33368c724f996e" + }, + { + "dataPath": "params_shard_245.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.45.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "27a0518359f0e23091c9d4c39d47d2aa" + }, + { + "dataPath": "params_shard_246.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.45.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "c55d58b8b568acd4eeeeed77233a73d5" + }, + { + "dataPath": "params_shard_247.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.46.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "4a31c9ad18e9b06edd5f9f0ee0b008a1" + }, + { + "dataPath": "params_shard_248.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.46.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "eb661117f8068611fe8d4d9474ee32f9" + }, + { + "dataPath": "params_shard_249.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.46.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "864d10717312494dd95cc4481efdc888" + }, + { + "dataPath": "params_shard_250.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.45.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.45.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.45.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.45.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.46.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.46.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.46.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "56e2d2b23aae86fd26868bd7ebe131b5" + }, + { + "dataPath": "params_shard_251.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.46.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "a5726012e1f622c5c27beea36941639b" + }, + { + "dataPath": "params_shard_252.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.46.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "72623bac2b2d1853b685a44734e39531" + }, + { + "dataPath": "params_shard_253.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.47.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "b3f77cf29a14122728f4f79909b978a0" + }, + { + "dataPath": "params_shard_254.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.47.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "99d611b1b6d4ffc5d37adffd61f74967" + }, + { + "dataPath": "params_shard_255.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.47.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "2a8e32e8b9a1c13d611939a22e9ac6d6" + }, + { + "dataPath": "params_shard_256.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.47.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "4122e864361bc7070e55cc173596a6cc" + }, + { + "dataPath": "params_shard_257.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.47.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "a15642d0bb387e4218f5fb134fa08e84" + }, + { + "dataPath": "params_shard_258.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.48.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "5df611f8fe76ea4752150ced560f3cfc" + }, + { + "dataPath": "params_shard_259.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.46.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.46.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.47.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.47.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.47.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.47.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.47.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.48.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "37a1872c9fb9076452dc28df6adb197d" + }, + { + "dataPath": "params_shard_260.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.48.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "5b913c84c2d02344b3a0cef60220a8f3" + }, + { + "dataPath": "params_shard_261.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.48.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "418ec4724e682c540a745b0f31292122" + }, + { + "dataPath": "params_shard_262.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.48.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "69d6a2f214ca48eb07d28545078b163e" + }, + { + "dataPath": "params_shard_263.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.48.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "dd9445df4b0362cba30d76ba9bc3caf6" + }, + { + "dataPath": "params_shard_264.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.49.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "dde62871e184a48293dbe50488a50d74" + }, + { + "dataPath": "params_shard_265.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.49.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "e0a14db14bb750a8d08a94f841fe16cb" + }, + { + "dataPath": "params_shard_266.bin", + "format": "raw-shard", + "nbytes": 23535616, + "records": [ + { + "name": "model.layers.48.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.48.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.48.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.48.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.49.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.49.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23519232 + } + ], + "md5sum": "99e4d3ca98ba68fe20dfa6d89d3a69fd" + }, + { + "dataPath": "params_shard_267.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.49.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "9cb6222036cadcf44dca1a6e27533776" + }, + { + "dataPath": "params_shard_268.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.49.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "204c9d46384c20b3f0fd950b6b7e207f" + }, + { + "dataPath": "params_shard_269.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.49.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "cbaca1c48faac93b6c4ae3bd2d13d4fb" + }, + { + "dataPath": "params_shard_270.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.50.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "b7e0265b608fbada3377d6371769c9bc" + }, + { + "dataPath": "params_shard_271.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.50.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "2eecc52e6418582b8fbdaafe10d6ca92" + }, + { + "dataPath": "params_shard_272.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.50.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "384cdc8d17fd72fbaca68fffbfb00c1b" + }, + { + "dataPath": "params_shard_273.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.50.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "8c6c6fc533f6b6647353e2491ac5e2f8" + }, + { + "dataPath": "params_shard_274.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.50.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "82b95f3d47f9e4912164cf4d2a84d948" + }, + { + "dataPath": "params_shard_275.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.49.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.49.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.49.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 11763712 + }, + { + "name": "model.layers.50.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.50.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15138816 + }, + { + "name": "model.layers.50.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26886144 + }, + { + "name": "model.layers.50.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26902528 + } + ], + "md5sum": "1f6ed72bce5972e6bd43974b936d32df" + }, + { + "dataPath": "params_shard_276.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.51.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "abf4053c2d43731ffe989458af7b84e9" + }, + { + "dataPath": "params_shard_277.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.51.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "9f2341772fef8c7927e75790099e24f7" + }, + { + "dataPath": "params_shard_278.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.51.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "4e60b7668cb2192bd4ee6ed7437ef3af" + }, + { + "dataPath": "params_shard_279.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.51.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "e4e2aae29ca45ac16cf47576f798e1be" + }, + { + "dataPath": "params_shard_280.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.51.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "48d90ef125f738aadd8323eb22044dd4" + }, + { + "dataPath": "params_shard_281.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.52.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "73f8ae6756366770f959de32f6e05af7" + }, + { + "dataPath": "params_shard_282.bin", + "format": "raw-shard", + "nbytes": 22712320, + "records": [ + { + "name": "model.layers.50.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.51.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.51.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.51.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.51.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.51.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.52.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22695936 + } + ], + "md5sum": "eaeb795213ec722f1932eb275f56e24e" + }, + { + "dataPath": "params_shard_283.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.52.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "cfe61800881204bc1c668afbad39a5cf" + }, + { + "dataPath": "params_shard_284.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.52.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "31e0c233b0b00bb150ff8499d36d6b87" + }, + { + "dataPath": "params_shard_285.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.52.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "721dcb184e38db8007544d5ce4972fac" + }, + { + "dataPath": "params_shard_286.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.52.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "463990557c6599f84d6b261116120dab" + }, + { + "dataPath": "params_shard_287.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.53.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "1cf363444055d2902da975d536371020" + }, + { + "dataPath": "params_shard_288.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.53.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "aa120c9b248911e2cdf7a64ab0ea6aea" + }, + { + "dataPath": "params_shard_289.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.53.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "16a14156860e391f0467f12327e238f9" + }, + { + "dataPath": "params_shard_290.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.53.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "dd35daa1b81db0eb59f4c65bbf658276" + }, + { + "dataPath": "params_shard_291.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.52.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.52.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.52.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.52.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.53.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.53.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19337216 + }, + { + "name": "model.layers.53.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31084544 + } + ], + "md5sum": "e4c5f95ad2701383915ba4b5debe3d1c" + }, + { + "dataPath": "params_shard_292.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.53.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.53.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "7fb05ae33a23dbe959faf94ba0729181" + }, + { + "dataPath": "params_shard_293.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.54.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "97c0dcbbdfb4b25ca32ba04a998bdedf" + }, + { + "dataPath": "params_shard_294.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.54.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "2a773802c7964b23b61cd52c1a053615" + }, + { + "dataPath": "params_shard_295.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.54.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "e732aad57642f56fde62113c3bdd5e59" + }, + { + "dataPath": "params_shard_296.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.53.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.54.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 3358720 + }, + { + "name": "model.layers.54.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26869760 + } + ], + "md5sum": "ea47b8cfcf64c4f527041d2168018c09" + }, + { + "dataPath": "params_shard_297.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.54.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "009e9b5894c5c6625135293de848fc9b" + }, + { + "dataPath": "params_shard_298.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.55.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "0c60fb8a32f8b80388156bed84ea7578" + }, + { + "dataPath": "params_shard_299.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.55.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "ffc5ef164e2745e0607cba78dd6ac08e" + }, + { + "dataPath": "params_shard_300.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.55.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "4ef1bb28f020dbc92adab242b17971b6" + }, + { + "dataPath": "params_shard_301.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.55.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "5d9c944750569525a9c8237d60354074" + }, + { + "dataPath": "params_shard_302.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.55.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "66ec3bafdf8482810a0cbcc559f1d175" + }, + { + "dataPath": "params_shard_303.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.54.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.54.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.54.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.54.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.55.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15138816 + }, + { + "name": "model.layers.55.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15155200 + }, + { + "name": "model.layers.55.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26902528 + }, + { + "name": "model.layers.55.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26918912 + } + ], + "md5sum": "945e6e634a6e7d61afb04c17168a40d9" + }, + { + "dataPath": "params_shard_304.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.56.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "2aeb274bc4408e94efc81c12848f36d2" + }, + { + "dataPath": "params_shard_305.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.56.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "8a3fa570bcb65a3d27c3f1d7853802d2" + }, + { + "dataPath": "params_shard_306.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.56.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "db5d9c87f75d9b995144940d3496e071" + }, + { + "dataPath": "params_shard_307.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.56.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "7262d706b138f55f290e0704f8fe1a7f" + }, + { + "dataPath": "params_shard_308.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.56.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "76369fb49a3f6574c441f2478f77146e" + }, + { + "dataPath": "params_shard_309.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.57.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "c59a9fae455cbdf91381b9a3d705d7d7" + }, + { + "dataPath": "params_shard_310.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.57.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "346ab1d8f32be50516476f83a6d566ec" + }, + { + "dataPath": "params_shard_311.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.57.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "d8bc38770451c90e41f3b5da34b48a77" + }, + { + "dataPath": "params_shard_312.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.57.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "eb6703a1211505bcd6d6d5d731ef4223" + }, + { + "dataPath": "params_shard_313.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.57.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "6358a1f2d70af7908d5200bac99f756d" + }, + { + "dataPath": "params_shard_314.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.55.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.56.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.56.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.56.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.56.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.56.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.57.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.57.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.57.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "8c5fb4f4830463da77eb464fb33aed0b" + }, + { + "dataPath": "params_shard_315.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.58.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "890bb8da90c8305b23663a9592d8cb4e" + }, + { + "dataPath": "params_shard_316.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.58.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "e2dbb774beff377aba55b1464630b0b5" + }, + { + "dataPath": "params_shard_317.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.58.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "bc24c80118a7384e1a05d6c299396fc3" + }, + { + "dataPath": "params_shard_318.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.58.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "df02798dbe3b68df547a25d2dea4ea5a" + }, + { + "dataPath": "params_shard_319.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.58.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "0e4b8d23d6e3016addd27cfadb15b4ae" + }, + { + "dataPath": "params_shard_320.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.59.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "e1644a38f4377b2133659057c26656ad" + }, + { + "dataPath": "params_shard_321.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.57.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.57.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.58.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.58.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.58.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.58.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.58.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.59.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "e58f78db8061117d4f943da8058f595e" + }, + { + "dataPath": "params_shard_322.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.59.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "8c4a26941355be0774ad93d7cf2e43d1" + }, + { + "dataPath": "params_shard_323.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.59.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "512435047ef43ac6185a3c232fa825fe" + }, + { + "dataPath": "params_shard_324.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.59.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "1903bf321465a3f3fe3dcf1e87eb53ce" + }, + { + "dataPath": "params_shard_325.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.59.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "85c735b79382f0d3c095e8924144b099" + }, + { + "dataPath": "params_shard_326.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.60.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "dcc24a2db8d5fbab64df08db38f6d6ff" + }, + { + "dataPath": "params_shard_327.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.60.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "87fa881f33c536c05ae0997264d12b59" + }, + { + "dataPath": "params_shard_328.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.60.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "6bcbad11d1c589fb246304821764de0c" + }, + { + "dataPath": "params_shard_329.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.59.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.59.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.59.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.59.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.60.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.60.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.60.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "8c7bc7c113bd359e56ab1489eca4315c" + }, + { + "dataPath": "params_shard_330.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.60.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "1cb6cd024cd0ee0f7b2782057c6e05ec" + }, + { + "dataPath": "params_shard_331.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.60.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "b8a12b06c74a51d0b5e8c94cca636ab7" + }, + { + "dataPath": "params_shard_332.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.61.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "73673e599c5af53b99faa2be01beddbb" + }, + { + "dataPath": "params_shard_333.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.61.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "5854e21316be164d5042a10ccad969f3" + }, + { + "dataPath": "params_shard_334.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.61.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "1dabb52b3783ee944acbbc62549c1db6" + }, + { + "dataPath": "params_shard_335.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.61.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "343dbe4061269298057d26ab42b20d52" + }, + { + "dataPath": "params_shard_336.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.61.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "cf02c64fe7fc06573cd3992f48823b66" + }, + { + "dataPath": "params_shard_337.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.62.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "1ef41340f537b5bdee6b0ca5fbbb5cd0" + }, + { + "dataPath": "params_shard_338.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.60.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.60.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.61.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.61.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.61.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.61.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.61.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.62.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "c8effcdf5f9bd9c748516dcf513ad5f9" + }, + { + "dataPath": "params_shard_339.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.62.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "81433b5aaa936f7c3df008e630e0a97f" + }, + { + "dataPath": "params_shard_340.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.62.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "0b8ca52fc7369e462eb9182bf0a7807c" + }, + { + "dataPath": "params_shard_341.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.62.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "07670440e1139021ef417000c3cb7ada" + }, + { + "dataPath": "params_shard_342.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.62.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "c8f69b27fcfafae9e2561c7e87b06f46" + }, + { + "dataPath": "params_shard_343.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.63.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "7030654e7c0fce24d48eb1d6e7977ba2" + }, + { + "dataPath": "params_shard_344.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.63.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "c519f5aa272d7010b3af0c202fe59d94" + }, + { + "dataPath": "params_shard_345.bin", + "format": "raw-shard", + "nbytes": 23535616, + "records": [ + { + "name": "model.layers.62.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.62.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.62.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.62.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.63.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.63.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23519232 + } + ], + "md5sum": "1cc586e81617850f5cefeb8c842596da" + }, + { + "dataPath": "params_shard_346.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.63.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "441aa892ff6ff5a0006002086db77e50" + }, + { + "dataPath": "params_shard_347.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.63.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "dd4916180eec5a91ee70338d9cf4b4ec" + }, + { + "dataPath": "params_shard_348.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.63.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "78c87f1cfbb4cb62a529e29daac36759" + }, + { + "dataPath": "params_shard_349.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.64.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "1e9f9fbd8b6fa2fa4ffc0c7803ed9b02" + }, + { + "dataPath": "params_shard_350.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.64.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "30a1037542d3c0247f7ab752ab05cb66" + }, + { + "dataPath": "params_shard_351.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.64.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "0e2fbffe95233136ea3d978166d7c9e7" + }, + { + "dataPath": "params_shard_352.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.64.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "1b9d336b2ce8a05dc5d51c287746cfe4" + }, + { + "dataPath": "params_shard_353.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.64.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "c57da21fe1223ace8f564e77a16430bf" + }, + { + "dataPath": "params_shard_354.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.63.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.63.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.63.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 11763712 + }, + { + "name": "model.layers.64.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.64.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15138816 + }, + { + "name": "model.layers.64.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26886144 + }, + { + "name": "model.layers.64.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26902528 + } + ], + "md5sum": "d2e87920bfc92d5306dab5a503c071e9" + }, + { + "dataPath": "params_shard_355.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.65.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "88c6deb7d76095aa900e51bc8e92728d" + }, + { + "dataPath": "params_shard_356.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.65.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "42e5d998cada889d99aec0137c7c0cdb" + }, + { + "dataPath": "params_shard_357.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.65.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "57a8edbe44224038b14c16a8d4232ebd" + }, + { + "dataPath": "params_shard_358.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.65.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "7762817c7fc469e4e87a5a6877553267" + }, + { + "dataPath": "params_shard_359.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.65.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "c264d231c260ea9d01857049da2bd069" + }, + { + "dataPath": "params_shard_360.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.66.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "405208a8b62a6276b8f49b0c4022a432" + }, + { + "dataPath": "params_shard_361.bin", + "format": "raw-shard", + "nbytes": 22712320, + "records": [ + { + "name": "model.layers.64.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.65.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.65.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.65.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.65.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.65.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.66.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22695936 + } + ], + "md5sum": "eca36381ce342277736014bff63b42fd" + }, + { + "dataPath": "params_shard_362.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.66.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "7669a16ec17357b2594f0e7571f397f4" + }, + { + "dataPath": "params_shard_363.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.66.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "38a4770e66d099c3b732998fb605461e" + }, + { + "dataPath": "params_shard_364.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.66.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "1e145d23a3ea500bbb88870d0295a417" + }, + { + "dataPath": "params_shard_365.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.66.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "f707ba4d3e6de9063f77a16764cb515a" + }, + { + "dataPath": "params_shard_366.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.67.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "60f6d4baf354dc15af5e9d1126a53040" + }, + { + "dataPath": "params_shard_367.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.67.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "7fcdbadaed1798416d9e06d545aa2eb8" + }, + { + "dataPath": "params_shard_368.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.67.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "a9e710e88891c6c10cf60eab90c43727" + }, + { + "dataPath": "params_shard_369.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.67.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "a4088b8125a0a2678bd394ec384dcaea" + }, + { + "dataPath": "params_shard_370.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.66.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.66.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.66.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.66.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.67.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.67.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19337216 + }, + { + "name": "model.layers.67.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31084544 + } + ], + "md5sum": "5ed662a1fb2509355a37077e624102c2" + }, + { + "dataPath": "params_shard_371.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.67.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.67.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "32b48c1de505123bd44d72d8ea491ff2" + }, + { + "dataPath": "params_shard_372.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.68.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "f7334b0662bd1f6274a0bb08bb4dfd27" + }, + { + "dataPath": "params_shard_373.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.68.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "f874212147c859e4de8eaff13100a9c5" + }, + { + "dataPath": "params_shard_374.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.68.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "06d0dcb2cd121dc3bc732437c9e7b583" + }, + { + "dataPath": "params_shard_375.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.67.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.68.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 3358720 + }, + { + "name": "model.layers.68.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26869760 + } + ], + "md5sum": "691002f3b73faba9cd1383bd0c0aabcc" + }, + { + "dataPath": "params_shard_376.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.68.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "1a6bb88ff4e11cbdacf129b17a1dcab5" + }, + { + "dataPath": "params_shard_377.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.69.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "52434c067d0477d95008346623bd5fa6" + }, + { + "dataPath": "params_shard_378.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.69.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "6799b4871a0719f52482c0ac334b32f6" + }, + { + "dataPath": "params_shard_379.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.69.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "d4f0c83d0d66ec47c4ce441b7e11af98" + }, + { + "dataPath": "params_shard_380.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.69.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "defc1746013d5ad6370379b021c70b4a" + }, + { + "dataPath": "params_shard_381.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.69.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "04c148f16f5ef2e7f735b1c1dbdf6e92" + }, + { + "dataPath": "params_shard_382.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.68.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.68.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.68.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.68.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.69.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15138816 + }, + { + "name": "model.layers.69.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15155200 + }, + { + "name": "model.layers.69.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26902528 + }, + { + "name": "model.layers.69.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26918912 + } + ], + "md5sum": "8646fad5200b90738c013de5a1462c7b" + }, + { + "dataPath": "params_shard_383.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.70.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "d2f2fae4625f9c97d5ff058dfd393fa7" + }, + { + "dataPath": "params_shard_384.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.70.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "e21808f1b03a49d410d92fc43e04a480" + }, + { + "dataPath": "params_shard_385.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.70.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "5a3a73321cbe56e7d32b9bc50e490baa" + }, + { + "dataPath": "params_shard_386.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.70.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "f1c283ca2db2f16e7d7e4dc9e6f20b97" + }, + { + "dataPath": "params_shard_387.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.70.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "9964fa426c0b9bf3855c889653a370ae" + }, + { + "dataPath": "params_shard_388.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.71.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "22b1bd8146d711aaa45c4c67f3adc368" + }, + { + "dataPath": "params_shard_389.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.71.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "aa512f4d5f0a5dc084bbebd1314177fb" + }, + { + "dataPath": "params_shard_390.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.71.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "96b66505157e4f5eb3eae83ab01b6809" + }, + { + "dataPath": "params_shard_391.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.71.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "7f4d8c3661d54c12375cea5e82719c13" + }, + { + "dataPath": "params_shard_392.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.7.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "93a77430091259c5e5c2d2700147c2ae" + }, + { + "dataPath": "params_shard_393.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.69.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.70.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.70.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.70.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.70.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.70.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.71.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.71.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.7.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "45bed7d319e2079b1cb6bc284e00056d" + }, + { + "dataPath": "params_shard_394.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.7.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "de8630a9a7bb5f67426d86bbfef17f57" + }, + { + "dataPath": "params_shard_395.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.7.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "e0b9db5b6f78b8e3a6f33898305c502e" + }, + { + "dataPath": "params_shard_396.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.7.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "e2f8bea6dfe5deb37f176828d73f86cf" + }, + { + "dataPath": "params_shard_397.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.8.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "5ee766f28189128557638fa31f3c7660" + }, + { + "dataPath": "params_shard_398.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.8.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "0d6555331560bd6d5961ebdebfb2a24e" + }, + { + "dataPath": "params_shard_399.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.8.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "6e0d034ea9812ade840df7d6c32d472e" + }, + { + "dataPath": "params_shard_400.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.8.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "0dc2308c9580c8f569475dba5c3ace4a" + }, + { + "dataPath": "params_shard_401.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.8.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "bf6f3cd6449cebb8724d810a67f5bb10" + }, + { + "dataPath": "params_shard_402.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.7.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.7.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.7.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 11763712 + }, + { + "name": "model.layers.8.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.8.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15138816 + }, + { + "name": "model.layers.8.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26886144 + }, + { + "name": "model.layers.8.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26902528 + } + ], + "md5sum": "7fb073d8ef65a14d27c2396391b00266" + }, + { + "dataPath": "params_shard_403.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.9.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "35b5d8437fdfc13abc2557742d651fab" + }, + { + "dataPath": "params_shard_404.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.9.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "0ce7c0212a696d1b9240b4c9c0d095b7" + }, + { + "dataPath": "params_shard_405.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.9.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "ad0244056ba74064c00a4dd329861e74" + }, + { + "dataPath": "params_shard_406.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.9.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "469b77c65c70b748afedf7e7d5cd16bf" + }, + { + "dataPath": "params_shard_407.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.9.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "243f6fc9016298b5cc7265c9b1bd1b8e" + }, + { + "dataPath": "params_shard_408.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.71.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "4fe1baaa4505c481cbc1c162ea634158" + }, + { + "dataPath": "params_shard_409.bin", + "format": "raw-shard", + "nbytes": 22712320, + "records": [ + { + "name": "model.layers.8.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.9.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.9.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.9.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.9.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.9.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.71.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22695936 + } + ], + "md5sum": "3e20a07aceb3e936fc71ab19839c74e5" + }, + { + "dataPath": "params_shard_410.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.72.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "d26c4b59ab16b5bb7bafeef24364dab5" + }, + { + "dataPath": "params_shard_411.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.72.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "b348967819cce122e1a564eddd874a10" + }, + { + "dataPath": "params_shard_412.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.72.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "442e764bff1337cc1ba148580128b363" + }, + { + "dataPath": "params_shard_413.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.72.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "e112a40a3217efcab796c80c85a038c0" + }, + { + "dataPath": "params_shard_414.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.72.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "697cda91e48730ca119e5e48886dbc5e" + }, + { + "dataPath": "params_shard_415.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.73.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "c7d9ad7bb1ef317339d6861d4aeb478d" + }, + { + "dataPath": "params_shard_416.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.71.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.71.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.72.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.72.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.72.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.72.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.72.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.73.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "d9df58105ac12d01d43a544def9b821f" + }, + { + "dataPath": "params_shard_417.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.73.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "e35f2c964dc4d65d0ef842fb6eabc44b" + }, + { + "dataPath": "params_shard_418.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.73.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "2d3d284def90311f38eb1fb0927b69a9" + }, + { + "dataPath": "params_shard_419.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.73.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "2ecdd8d1095328fadb9d93db10b5ba17" + }, + { + "dataPath": "params_shard_420.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.73.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "e51d08a1b3e91ea78d9edb12f3ef4342" + }, + { + "dataPath": "params_shard_421.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.74.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "8f9a2ec8dc45315abf905a9c91d10820" + }, + { + "dataPath": "params_shard_422.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.74.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "f42870934c3b0cd7c761401144b89e90" + }, + { + "dataPath": "params_shard_423.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.74.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "ec6432fa3905810666e36b25a4419251" + }, + { + "dataPath": "params_shard_424.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.73.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.73.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.73.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.73.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.74.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.74.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.74.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "c4cac964836ad19afa75316c075a8f65" + }, + { + "dataPath": "params_shard_425.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.74.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "aa90471382e008472d96b2f228b6d868" + }, + { + "dataPath": "params_shard_426.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.74.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "952ef528cf7cdc3b3e0c0cdc1825d1a8" + }, + { + "dataPath": "params_shard_427.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.75.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "111531a0aa45a2f08af111520e623f4a" + }, + { + "dataPath": "params_shard_428.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.75.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "1e8c94c77c5e84c6da07d9f37f1db212" + }, + { + "dataPath": "params_shard_429.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.75.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "71c07ac9ef1c1b7dc81ddbbd8edb613f" + }, + { + "dataPath": "params_shard_430.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.75.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "42beb051f20350c0147d1bc82f185650" + }, + { + "dataPath": "params_shard_431.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.75.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "cd19750610bdca2ca11bf90b2a87fbc3" + }, + { + "dataPath": "params_shard_432.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.76.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "e1809cdfd7fa3499de330dba41a69cce" + }, + { + "dataPath": "params_shard_433.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.74.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.74.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.75.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.75.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.75.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.75.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.75.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.76.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "eeaf1d28cc77f240eaf75eb279833ec9" + }, + { + "dataPath": "params_shard_434.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.76.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "f5963cdf3928fb8c5d0e1d6c7a5e31f1" + }, + { + "dataPath": "params_shard_435.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.76.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "8a5d50a733e1649e8961d228689f62c4" + }, + { + "dataPath": "params_shard_436.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.76.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "cbf3d3a73ec723cd9ac00d1f626b3935" + }, + { + "dataPath": "params_shard_437.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.76.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "1ac0c87c33d3c90d02d4e61c1c6bc5d8" + }, + { + "dataPath": "params_shard_438.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.77.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "4962b849e576bb88c3cfae59fd403da1" + }, + { + "dataPath": "params_shard_439.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.77.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "99f8f10fbbebc9bd40a3a2a6227bc5ce" + }, + { + "dataPath": "params_shard_440.bin", + "format": "raw-shard", + "nbytes": 23535616, + "records": [ + { + "name": "model.layers.76.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.76.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.76.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.76.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.77.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.77.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23519232 + } + ], + "md5sum": "ffd2c8b3056dc8062297daf352305c0a" + }, + { + "dataPath": "params_shard_441.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.77.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "1e215dc0fb22c8e01b0deb25814bae05" + }, + { + "dataPath": "params_shard_442.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.77.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "4336195af27abc0284858b229adf6262" + }, + { + "dataPath": "params_shard_443.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.77.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "7d3db9276b91bd6b2a9b873628a071a9" + }, + { + "dataPath": "params_shard_444.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.78.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "8e6261ec272011be178869c5649b9e2f" + }, + { + "dataPath": "params_shard_445.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.78.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "36cefeb759b27f6a13544e1b8f44e63f" + }, + { + "dataPath": "params_shard_446.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.78.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "14ebf5cbc9415a4333ae96ffae43ff8e" + }, + { + "dataPath": "params_shard_447.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.78.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "d38dc1b83c1d08ac9492adf4f9d4237f" + }, + { + "dataPath": "params_shard_448.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.78.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "a666053bd43d4cfeae007f7ad201e885" + }, + { + "dataPath": "params_shard_449.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.77.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.77.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.77.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 11763712 + }, + { + "name": "model.layers.78.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.78.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15138816 + }, + { + "name": "model.layers.78.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26886144 + }, + { + "name": "model.layers.78.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26902528 + } + ], + "md5sum": "61b954a9705bb188007d20ac7d6efe50" + }, + { + "dataPath": "params_shard_450.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.79.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "a2f129bdba42e1b88fa255377a4e4cdf" + }, + { + "dataPath": "params_shard_451.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.79.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "63295d90d57458c7bfd5adbff3bf0ef9" + }, + { + "dataPath": "params_shard_452.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.79.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "e3a4f300f4eb2aded96e82799dd79bbe" + }, + { + "dataPath": "params_shard_453.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.79.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "106f42c8ee2141ed4374ea2ded38bd6c" + }, + { + "dataPath": "params_shard_454.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.79.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "2720b4074ed368e43c198d9b7cab8fe3" + }, + { + "dataPath": "params_shard_455.bin", + "format": "raw-shard", + "nbytes": 22712320, + "records": [ + { + "name": "model.layers.78.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.79.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.79.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.79.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.79.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.79.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.norm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22695936 + } + ], + "md5sum": "ca160894ac930a68f07df9f312658c7b" + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..fe73fb89d597752ddae3f187bdb965ee0587f602 --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d6d20e0b71a37518d4719073be0b9a77610a357bbe5957f830c433c11f9c24e +size 420679680 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..a2c7d0842af94dbb770c7ec0f697e3cecadb35a5 --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24032d8f6b607fe15cd2bd179b737c0789b1782671e860e51fe2c7cae044bd9f +size 52584960 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee58c69552e79908818acd8119d00942763063ed --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77e5cf259458ca3db1cbad9bbc180bb251724aab2a366b2c5a81e9224a6efde0 +size 23511040 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad8ad77378758375aa459523a7dee84fa890ed28 --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5e7fcfbd37aca09ee84795d1604f92e970f23e2e0d9f8f44b3fe22bf5bb2398 +size 26869760 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..542099ca504044867d22eac0529af896de4b513d --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d2a40b662b35a34d036d771307c0efb198c74be6d5d83e921309a928feb500 +size 31100928 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..dbefef4286df793869086c4fd935f5d661073816 --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83240b129ee575ccea2816f332b5da695bc417f061ac8954dcb69e3ad7e22230 +size 93978624 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..2d074e5d3b1baeeb730e7dc786f0af4a46ff1acb --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c16566ef3ec5e933c7ceef4d36bbd688b08acbe1d1514989c5c1c4e38917785f +size 188088320 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..9ac24fab07a237e67ed317ce61fd86abe989716a --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c31d6d3b076796b426f84a61d4d56abfdfda5b9a4517f561b5b884e8f90feb9d +size 23511040 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea3a2b9c34fa1819b32b13aa9e39740aa9ebdebf --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2324503dd8d324a6ef56f1bddb9968cb877678f94a967a7be8b78817ba8cd326 +size 33587200 diff --git a/params_shard_106.bin b/params_shard_106.bin new file mode 100644 index 0000000000000000000000000000000000000000..04784a59967cb1161f85d7c2493eb30ad7a6d1e0 --- /dev/null +++ b/params_shard_106.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fceb03b3e75b0996319ebc68b99d2efcbb1a6306aa61ebb9cbbb389dafbba091 +size 26869760 diff --git a/params_shard_107.bin b/params_shard_107.bin new file mode 100644 index 0000000000000000000000000000000000000000..43c8cf0cbbaf31fd669d3fbe7f34282637bc2f65 --- /dev/null +++ b/params_shard_107.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd021f6bb2bfd1b1b08b305bb8dac89484ae290211c1aa659e288a99e4cd4d5 +size 93978624 diff --git a/params_shard_108.bin b/params_shard_108.bin new file mode 100644 index 0000000000000000000000000000000000000000..bc65e48433305df2bb78af66b2b11d00fb71dbd6 --- /dev/null +++ b/params_shard_108.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:979268ab2e211ec51caf1efcf25aac6be2b68789ba03da41f93ab33cfce63d8a +size 22712320 diff --git a/params_shard_109.bin b/params_shard_109.bin new file mode 100644 index 0000000000000000000000000000000000000000..e6f74bef9a3c5e8509f934cee380e187cfbccbcd --- /dev/null +++ b/params_shard_109.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8f90a96635d303a24a763c6634edbff8901c1bcc85998afb2c97cfad3f9373d +size 188088320 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..d63183ae034dc7f24f2b31a34b5c74aa15204464 --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca2d29b7d1b48f1d7c7864f3dd43bc5d43377ef2df88b7d16bc0954c11c0406 +size 33587200 diff --git a/params_shard_110.bin b/params_shard_110.bin new file mode 100644 index 0000000000000000000000000000000000000000..61611f1cc88dc2301a35a93267c83e8e2df2099a --- /dev/null +++ b/params_shard_110.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:881fa8f0089de8aadb51d14eadbaf632a0efd0dbb0b26d2578982cbdc70e0b61 +size 23511040 diff --git a/params_shard_111.bin b/params_shard_111.bin new file mode 100644 index 0000000000000000000000000000000000000000..3f094a75909cc6ca194282315a62f90165c82b61 --- /dev/null +++ b/params_shard_111.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc99a700fe9141fdc6b2ca3a62e68a7dd1cc4b20d8a0d2d9f006ee6013098baf +size 33587200 diff --git a/params_shard_112.bin b/params_shard_112.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0ed8b5b801ea228ee5bcee3780fc443a0bd2717 --- /dev/null +++ b/params_shard_112.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca8bb8c3dfcc12d5fb046a80630e6bb12e170bfa3d16c24890ad336a6919a50 +size 26869760 diff --git a/params_shard_113.bin b/params_shard_113.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2392f6464799a0841b8a5a0f91588637b907802 --- /dev/null +++ b/params_shard_113.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054c2f7a34e1bb3a2c30562927a5a52b2d16abcdba80dd8bd1f3396ff2ba94f2 +size 93978624 diff --git a/params_shard_114.bin b/params_shard_114.bin new file mode 100644 index 0000000000000000000000000000000000000000..0bcd2017f0f006b16cfba85c99b900713e4749e8 --- /dev/null +++ b/params_shard_114.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edeedf04ce0660e8fa8d56719a727237a09c268ed1d3339c7cb80ac5ce22f145 +size 188088320 diff --git a/params_shard_115.bin b/params_shard_115.bin new file mode 100644 index 0000000000000000000000000000000000000000..193258c089be34c0303c008a0e4be483db5fb273 --- /dev/null +++ b/params_shard_115.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556568ff581c16e5dfce47ec474c1de58c031399ab382df5676ccc4e6a14d42e +size 23511040 diff --git a/params_shard_116.bin b/params_shard_116.bin new file mode 100644 index 0000000000000000000000000000000000000000..a8eb28c2d47aa44eb4466372756c515e62c34088 --- /dev/null +++ b/params_shard_116.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e23d1806463bc8be0d9d1e37541d3e024aa7072234dfa8631e1b990bc4c1e1ab +size 33587200 diff --git a/params_shard_117.bin b/params_shard_117.bin new file mode 100644 index 0000000000000000000000000000000000000000..c4d48abf865bd84a8c25dcb4874f986dee76801a --- /dev/null +++ b/params_shard_117.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12dd50323b7d1a67ea4c35ad6f22c817a0ebe2a78b30800495be4f164253746d +size 31100928 diff --git a/params_shard_118.bin b/params_shard_118.bin new file mode 100644 index 0000000000000000000000000000000000000000..c8f44bccb68b58644648835c502abb8bc215cffe --- /dev/null +++ b/params_shard_118.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ea81a01d6881c017e64a96cba5754b87a945002fbb9294233336a4f9183cc0 +size 31068160 diff --git a/params_shard_119.bin b/params_shard_119.bin new file mode 100644 index 0000000000000000000000000000000000000000..e4c57ffc9112d3491a762a6f52ed1a2dfb868957 --- /dev/null +++ b/params_shard_119.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab16cc898b978033c35cb22dcff7f88670246c33e1aa6049f3b8eb91d27fb29d +size 188088320 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a2435a4479ca7dcf2763201d858147ea9d58cc6 --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f979793a64a197193e1acea2ec25c53d99c092cd09e9f15b610954cb4c887e48 +size 26869760 diff --git a/params_shard_120.bin b/params_shard_120.bin new file mode 100644 index 0000000000000000000000000000000000000000..c8cb9dc6e832eb7e989db652e79096044376ade6 --- /dev/null +++ b/params_shard_120.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:605209f18f930aad56674cfc8c76fe13c940282be516d2983d4d1947ca7c4133 +size 33587200 diff --git a/params_shard_121.bin b/params_shard_121.bin new file mode 100644 index 0000000000000000000000000000000000000000..cfda105692bf15acfac0e512a0db4dfd6d72aca7 --- /dev/null +++ b/params_shard_121.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4314be88603833c78ee45a0bec47abe4f487addee0ec763a35bcf593051de1a +size 26869760 diff --git a/params_shard_122.bin b/params_shard_122.bin new file mode 100644 index 0000000000000000000000000000000000000000..f20deb5576c0755b2ff068b6842c71901a8f31f3 --- /dev/null +++ b/params_shard_122.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e4e9aeb64c785379827eb283aa0e55cba8cd5e86917c4b2325d2ecc8326955d +size 31068160 diff --git a/params_shard_123.bin b/params_shard_123.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c8920c694556a4b546d89c8e1879b238c027044 --- /dev/null +++ b/params_shard_123.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f365f776ab96a67974c4131a38944d243baee8beb4b4e30e47975b1f83f1af8 +size 93978624 diff --git a/params_shard_124.bin b/params_shard_124.bin new file mode 100644 index 0000000000000000000000000000000000000000..867e08c732e2557635c7eded892a11a64dcccebc --- /dev/null +++ b/params_shard_124.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf353049ed569c90559712d5786b1c03b962b827c6344442c8820a10eeb3bdf9 +size 93978624 diff --git a/params_shard_125.bin b/params_shard_125.bin new file mode 100644 index 0000000000000000000000000000000000000000..11ea35e67612040a58fbe176233ffef4403a1cb8 --- /dev/null +++ b/params_shard_125.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca081ef6446f865af9c65725964d5eec4a213dcbb4013fc30478a40742fe3919 +size 188088320 diff --git a/params_shard_126.bin b/params_shard_126.bin new file mode 100644 index 0000000000000000000000000000000000000000..f04aa060421d0de7cc1ee5df5ab8e6cb779540d8 --- /dev/null +++ b/params_shard_126.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c8f360de5ac1b0ea51ec1beb34c6e165dce18f121c1f622a7a1ff53d644236b +size 23511040 diff --git a/params_shard_127.bin b/params_shard_127.bin new file mode 100644 index 0000000000000000000000000000000000000000..0056500fc3b1e77fcf666d29c645ba4a44125e9f --- /dev/null +++ b/params_shard_127.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:721c6de84fb0c40899d6205356b60f28f71c76615b06d91e6042a3243b37e750 +size 33587200 diff --git a/params_shard_128.bin b/params_shard_128.bin new file mode 100644 index 0000000000000000000000000000000000000000..1bf0f7d2283128eb1cc83bc724df4e7eed059717 --- /dev/null +++ b/params_shard_128.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:668be9b807c9b5c9a9d10e2413b09f3db7b4863ad03cf7cec220b596addc8ef8 +size 26869760 diff --git a/params_shard_129.bin b/params_shard_129.bin new file mode 100644 index 0000000000000000000000000000000000000000..95fcdcd51b3eabb027a0eafd6619c6f808cd5b5e --- /dev/null +++ b/params_shard_129.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a20c4171c8e408541224f58f9c6681b12b95533c109a49311f9993721c504987 +size 31117312 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..986b921df45d337a35bc628432860bb1af64e9b9 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c3c6e270217c91be350330961fd0e429a67ae9e747d6162d48c3a7fd4a9818c +size 93978624 diff --git a/params_shard_130.bin b/params_shard_130.bin new file mode 100644 index 0000000000000000000000000000000000000000..a39931f81e7770557cc406af76c98f2839db9cce --- /dev/null +++ b/params_shard_130.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce1d0de7f92809fab0162ffacc569d8299ae73e608951646900a54a01a1808b5 +size 93978624 diff --git a/params_shard_131.bin b/params_shard_131.bin new file mode 100644 index 0000000000000000000000000000000000000000..6f42c072126e974d8ab326970a1eda2b281607eb --- /dev/null +++ b/params_shard_131.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6a0a536d0eb2b0887268e71b6af186a2243cf23439ef92bc1b7991b6697cf0b +size 188088320 diff --git a/params_shard_132.bin b/params_shard_132.bin new file mode 100644 index 0000000000000000000000000000000000000000..214924606ec9eac11fee3f771bb90f6d026c5d13 --- /dev/null +++ b/params_shard_132.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd21825728eb6912f628d96ba219ec3172f701f970570cf91c9377526babe39c +size 23511040 diff --git a/params_shard_133.bin b/params_shard_133.bin new file mode 100644 index 0000000000000000000000000000000000000000..3b8260c533aa15306e3f4fe9a92e69061a626aba --- /dev/null +++ b/params_shard_133.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf832b6c4fd3af6302a91a16e84d8ac91cdc7a02edbb0b355a7e9f7384edbca9 +size 33587200 diff --git a/params_shard_134.bin b/params_shard_134.bin new file mode 100644 index 0000000000000000000000000000000000000000..33898b28c455753ed28b8fc13580ab7c00dafda2 --- /dev/null +++ b/params_shard_134.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbbb86d1b157752d3dfc9583afa8fa9a04c6fc0a65183a40635fbe4134f6baa7 +size 26869760 diff --git a/params_shard_135.bin b/params_shard_135.bin new file mode 100644 index 0000000000000000000000000000000000000000..97b7f094375e95d54a621e324fc6aa8ef16cc4b9 --- /dev/null +++ b/params_shard_135.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:062f10a3f1da3dac52b01d0d61b6c8df7166c464ea7978f8fa9597f17ccfdd8b +size 188088320 diff --git a/params_shard_136.bin b/params_shard_136.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c372f59b96df40a7a066c7b9e558d41eefddc52 --- /dev/null +++ b/params_shard_136.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e341cbf9b1bb8aa1332174f018a60a4d8efa75ad2a4d223c60433b389f469bec +size 23511040 diff --git a/params_shard_137.bin b/params_shard_137.bin new file mode 100644 index 0000000000000000000000000000000000000000..e23ab285156ce2b3db48332380df0ec673348a07 --- /dev/null +++ b/params_shard_137.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e66551776be65fba011099fcba662beb8316e2646d6036f78c2748851102dd +size 33587200 diff --git a/params_shard_138.bin b/params_shard_138.bin new file mode 100644 index 0000000000000000000000000000000000000000..f81855dccd56b6fe0b742dfacfa701069e877eb3 --- /dev/null +++ b/params_shard_138.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03464fa39a92aa2a38dc640b727e32fccecfb43c5d1499a3c7783f69477b9271 +size 26869760 diff --git a/params_shard_139.bin b/params_shard_139.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c75bc15da31801e45ebeb578bf1e8235f1496cc --- /dev/null +++ b/params_shard_139.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76421b1d416b748f8cc33939f96f759542b630de3030a9b49f3a00a91ad57979 +size 93978624 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..5057a70b3bafe57191c16026fcd82b305901dd21 --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5894673c9c10fd1593183af4e774d2f395a8547563a6d1c1bad9a78d7b3ad6ba +size 26910720 diff --git a/params_shard_140.bin b/params_shard_140.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef47a69297755801571ce09ac19a613584e610a2 --- /dev/null +++ b/params_shard_140.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da586e76b7d2b772c9c6520e555c9550a395946011ada716819b4d2b689f0e01 +size 30269440 diff --git a/params_shard_141.bin b/params_shard_141.bin new file mode 100644 index 0000000000000000000000000000000000000000..c63e1f386792186c2c7c3da095fbe1972c43abdb --- /dev/null +++ b/params_shard_141.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e295458f0886b3a730f39923f1d2ae19d4129ef94615944627ec0e70e807ff6d +size 93978624 diff --git a/params_shard_142.bin b/params_shard_142.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d2b592355528ba7322fd34c5e0674763924681c --- /dev/null +++ b/params_shard_142.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff8017dab549f7f8bf2b4db45b2f24a0d1f864c330a87628d79b2745bd2dbd63 +size 188088320 diff --git a/params_shard_143.bin b/params_shard_143.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b4588f932eeebb49c5d7772cef8f4249c62e822 --- /dev/null +++ b/params_shard_143.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa90ecb057f72b32f84287532e077481002570511fb8d7aac4101c0a708b0bff +size 23511040 diff --git a/params_shard_144.bin b/params_shard_144.bin new file mode 100644 index 0000000000000000000000000000000000000000..fba760001ff3d3acdf413c3ca3422a9e4b31dce6 --- /dev/null +++ b/params_shard_144.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4da2dec12b52a6f96c06d34e6edbb6ea18e5bc6a9838859af6bf03e1b7fe245c +size 33587200 diff --git a/params_shard_145.bin b/params_shard_145.bin new file mode 100644 index 0000000000000000000000000000000000000000..3c9a8a9cb575ef4154f01ae076178934fb55c6a7 --- /dev/null +++ b/params_shard_145.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2199d693276b4f309ded00329ad865c12c1bd7007662c0c223e5434ff12c07dd +size 26869760 diff --git a/params_shard_146.bin b/params_shard_146.bin new file mode 100644 index 0000000000000000000000000000000000000000..587a1d230168e84514e297cb46f5c655e84f929d --- /dev/null +++ b/params_shard_146.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a8d8c30cbbf4f7dbd21278009658e0860f4e530137382778e235c68d30017d +size 93978624 diff --git a/params_shard_147.bin b/params_shard_147.bin new file mode 100644 index 0000000000000000000000000000000000000000..b768ac5bb4e9f3787d87b068b0c402ca1c68a763 --- /dev/null +++ b/params_shard_147.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5d57a5573387588852c203eeea3ea462b184e479a470f9ede9ee08a5f5af01f +size 31117312 diff --git a/params_shard_148.bin b/params_shard_148.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a174aa001e39b6d80e0b10e845c13a34992a489 --- /dev/null +++ b/params_shard_148.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab9d43aa0da80979a0712b11355f603f39dddc2390c3ab2623496f503b7f0a02 +size 188088320 diff --git a/params_shard_149.bin b/params_shard_149.bin new file mode 100644 index 0000000000000000000000000000000000000000..6ea3397e98857f745b40b9e40203b3b6b09c3806 --- /dev/null +++ b/params_shard_149.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cfac85179fa2d695df83006b4c782951a00ae82cce0d2827af1ef514a818e2e +size 23511040 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..39b7b5410765a398203c6d48fa1d8c74cbb42c41 --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:470ceddfb34c2f66245f7355d1f0076188270f46807c7d803fb93bbc7990382e +size 93978624 diff --git a/params_shard_150.bin b/params_shard_150.bin new file mode 100644 index 0000000000000000000000000000000000000000..65e73bbd7bc191b6b49910ecebe030589e04c6ca --- /dev/null +++ b/params_shard_150.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeb014f19e4ac26633cd0b6477cc320ad566d23d3610b6495a0ea932f1488098 +size 33587200 diff --git a/params_shard_151.bin b/params_shard_151.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b4ab64f86c82efeacefb43c76de451821301623 --- /dev/null +++ b/params_shard_151.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d38a9f06fd941eab0855fd8d358a063fe6f32c87b801d64deddcba026579bed9 +size 26869760 diff --git a/params_shard_152.bin b/params_shard_152.bin new file mode 100644 index 0000000000000000000000000000000000000000..e975c61e55f267e3a610a471de41b0c8a9e219f4 --- /dev/null +++ b/params_shard_152.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d6a9cd1071ff36be1e4b264c81518ddcc1e60aebef3655938f058ff3d6cdc7a +size 33587200 diff --git a/params_shard_153.bin b/params_shard_153.bin new file mode 100644 index 0000000000000000000000000000000000000000..ddcf9ef3dddefa8a4f2fbcad93940b5e12159183 --- /dev/null +++ b/params_shard_153.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fd5667444c75508db8c81c84787d7727805cc238e78a10eeb2628f2a064b5e5 +size 26869760 diff --git a/params_shard_154.bin b/params_shard_154.bin new file mode 100644 index 0000000000000000000000000000000000000000..fffd3d2ace0fc5ac8f2eba22340adaaf17945343 --- /dev/null +++ b/params_shard_154.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91cbe1054dd80b1fecdcfb5a3faeab6cf74149d677877b24225a4dccdeca5a11 +size 93978624 diff --git a/params_shard_155.bin b/params_shard_155.bin new file mode 100644 index 0000000000000000000000000000000000000000..0fc5ea9c5560c58680e77959c084894faad45818 --- /dev/null +++ b/params_shard_155.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85499445c75cf88541bf46c428e58f2213f1ec2e0937204c03a5762c784efc12 +size 26894336 diff --git a/params_shard_156.bin b/params_shard_156.bin new file mode 100644 index 0000000000000000000000000000000000000000..e82dca59182b0a7868b29e80f22f19c44721a5d4 --- /dev/null +++ b/params_shard_156.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72b7f6a162ed9531b70ec8c2b7f81139df537aba8912b0e3bc35633154405b2d +size 188088320 diff --git a/params_shard_157.bin b/params_shard_157.bin new file mode 100644 index 0000000000000000000000000000000000000000..c457ec8c8034710ee53b203d3a808a75522c8f1c --- /dev/null +++ b/params_shard_157.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:143da90e120c98935d4d41010ed2d4d6fa8039637a3defea72d99ecef1e4eb13 +size 23511040 diff --git a/params_shard_158.bin b/params_shard_158.bin new file mode 100644 index 0000000000000000000000000000000000000000..665c6f0faecc28627245bacdf3e731459358d8dd --- /dev/null +++ b/params_shard_158.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b2d5dd34579a4ef1f69728631451c91165188d175153dda6dc56b54dbade7d +size 93978624 diff --git a/params_shard_159.bin b/params_shard_159.bin new file mode 100644 index 0000000000000000000000000000000000000000..df4c07996bf6737e418a3111c78ebac7d2bff3e2 --- /dev/null +++ b/params_shard_159.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c3a4e6f623bd798d6de05458d1956c6ad98c1ec4a3730358355de0e4964f736 +size 188088320 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a2bffdbb3bf4f13c8193ae1f3650dd0a92b3009 --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f63a7fed63b51a3efe827e96dee2170668708cc948f3e92209780bee07d9e1f2 +size 188088320 diff --git a/params_shard_160.bin b/params_shard_160.bin new file mode 100644 index 0000000000000000000000000000000000000000..04e4a3104a700162d643a8f81956d6d52b4bfc90 --- /dev/null +++ b/params_shard_160.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27cfae4b9bcdfc6c0d5f9acf325c62fe7f0fe931966170b9bcc77f77cc2feda0 +size 23511040 diff --git a/params_shard_161.bin b/params_shard_161.bin new file mode 100644 index 0000000000000000000000000000000000000000..c64303fd843cf4348efd57c915f42deecc3b2a14 --- /dev/null +++ b/params_shard_161.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81a9839f35959141db342b70e60b8f1bc4a8de3014e69d3a057a2f39671f3583 +size 33587200 diff --git a/params_shard_162.bin b/params_shard_162.bin new file mode 100644 index 0000000000000000000000000000000000000000..00b2ce5fd210dfdd1f1b230df8df859d7ee441de --- /dev/null +++ b/params_shard_162.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08aa7ffc42a79085630d238b3214419588b670341fba0ffd0adf60b299b9fd37 +size 26869760 diff --git a/params_shard_163.bin b/params_shard_163.bin new file mode 100644 index 0000000000000000000000000000000000000000..5986aaf5bbfad09f954972b5e8d236879de2949d --- /dev/null +++ b/params_shard_163.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91f58c39ff97d13d9bccad4a285d6e722d4733265eb700510c0b949e14a93e09 +size 93978624 diff --git a/params_shard_164.bin b/params_shard_164.bin new file mode 100644 index 0000000000000000000000000000000000000000..f87f8ca1ecaf013d64605c76d7a8586776d62d1c --- /dev/null +++ b/params_shard_164.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b8c939a4f5718a7804cbec57579d25c379e92b432ec10744949b1cffa55ad3 +size 31117312 diff --git a/params_shard_165.bin b/params_shard_165.bin new file mode 100644 index 0000000000000000000000000000000000000000..a2019e8006463426369e55a99f84660c943543ae --- /dev/null +++ b/params_shard_165.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4f183af5ab8ad7f0988d41b5513127b1786252323aee68d13f735b5ee33bb22 +size 188088320 diff --git a/params_shard_166.bin b/params_shard_166.bin new file mode 100644 index 0000000000000000000000000000000000000000..a2014e3c35bb7cfc68e2d37e7cd87631a8ad5d94 --- /dev/null +++ b/params_shard_166.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70dc47a46a789d3c14e266e7902eee8b062e9f8ccd02a9f03b5f8c15256208c4 +size 23511040 diff --git a/params_shard_167.bin b/params_shard_167.bin new file mode 100644 index 0000000000000000000000000000000000000000..11be48ccadb01f35d9a11e28b93540db1bbc0678 --- /dev/null +++ b/params_shard_167.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:364a73da9ff1f9e703585917c31215041e9a41d5cb87c5239a0fee93980bd09b +size 33587200 diff --git a/params_shard_168.bin b/params_shard_168.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc054808e68a6f27d257de35ecdeecdbc1a3eb51 --- /dev/null +++ b/params_shard_168.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcbdd1e6730f70be82341fa06b83b4d81f253b920efa0c56e9c43d940245c998 +size 26869760 diff --git a/params_shard_169.bin b/params_shard_169.bin new file mode 100644 index 0000000000000000000000000000000000000000..545f014ab532ed5fbe5b25f8c34d654d69af7358 --- /dev/null +++ b/params_shard_169.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9299f02d7d3302ff0544154a0a6980aa000e8d7ef7f02e0684bbd600a18012a5 +size 33587200 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..fd3a6c4f30930da30d2072800bcee250b69d284c --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ebbf540374eff37988a3858a5239198673c684771f9abbe43ff48ecbcf567d8 +size 23511040 diff --git a/params_shard_170.bin b/params_shard_170.bin new file mode 100644 index 0000000000000000000000000000000000000000..5b07482dad0a2dddf70912dbd80cfee0eeb338f0 --- /dev/null +++ b/params_shard_170.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afe17a0750fcead4beb891a0b6efc34e46b4e90a1df58d272b9f3415a88066e9 +size 93978624 diff --git a/params_shard_171.bin b/params_shard_171.bin new file mode 100644 index 0000000000000000000000000000000000000000..6f663878b936b4d751be05b02865d80d56ffed02 --- /dev/null +++ b/params_shard_171.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:788a852184708a52e1528abf50bb41ca4b1c846855e4adb8b78c295b0520ab72 +size 23535616 diff --git a/params_shard_172.bin b/params_shard_172.bin new file mode 100644 index 0000000000000000000000000000000000000000..a8fc3d698fcfa06332a802f8a4b56028966bdaa4 --- /dev/null +++ b/params_shard_172.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea072deb424dd6253cb0606182048730c352550adee56c980975eb1740c6f801 +size 188088320 diff --git a/params_shard_173.bin b/params_shard_173.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd7dcb7790b24284fc0508487603a69d410f6c0b --- /dev/null +++ b/params_shard_173.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6730785ddf7d5502cd603dd04bc5fde2d59cf12baa4b29b140eaae2a094688f +size 23511040 diff --git a/params_shard_174.bin b/params_shard_174.bin new file mode 100644 index 0000000000000000000000000000000000000000..c03d0d76132a564920a681650c09c4e0b66b9823 --- /dev/null +++ b/params_shard_174.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b88123680f4f32e164680aa3b5b77aa3b6a87501e0e93021f23c5e53428df728 +size 26869760 diff --git a/params_shard_175.bin b/params_shard_175.bin new file mode 100644 index 0000000000000000000000000000000000000000..156a23a2beccdf632a606318237c375a18ef747d --- /dev/null +++ b/params_shard_175.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:219e561f51b23a65469186416342741fdea3d567eaba8afd4297fe3a9d25a376 +size 93978624 diff --git a/params_shard_176.bin b/params_shard_176.bin new file mode 100644 index 0000000000000000000000000000000000000000..c19288e4a119a3ff7dfc3739fa29f36287244cd7 --- /dev/null +++ b/params_shard_176.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54152a2799178e2140bde7a8ce98155a3cec1f6ea061a3b4bd15fd1deb6bd78 +size 188088320 diff --git a/params_shard_177.bin b/params_shard_177.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba90afd223bdba699cc2063a7252f11f7a47143e --- /dev/null +++ b/params_shard_177.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d727fe2c163fa5073c92ba86be84093d798a24cf0d5cd7eefb3590cae01fbcdf +size 23511040 diff --git a/params_shard_178.bin b/params_shard_178.bin new file mode 100644 index 0000000000000000000000000000000000000000..47eb0e023f5f7550f56223aef8f7913646091b9e --- /dev/null +++ b/params_shard_178.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f65b5858bac280bdd3e916c4d6a11ae642a0b705dd45393e7403bd28c3d7a7db +size 33587200 diff --git a/params_shard_179.bin b/params_shard_179.bin new file mode 100644 index 0000000000000000000000000000000000000000..7eb4b2c8ec8199a89d63d8007deaa8ad95f75399 --- /dev/null +++ b/params_shard_179.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c2d513b27f60c74d117d88de695ee36d6f743f4b9e7aa83fb3a95aee038fe1 +size 26869760 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..87dd2b8d3192adc3fde74b98250f603cfff97fe7 --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2801deadf68714b82a25b4558581af9e412b898b9be17432ece7535c42d09ac2 +size 33587200 diff --git a/params_shard_180.bin b/params_shard_180.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ad27832037f49d144bfa8325c02223ad5795cfc --- /dev/null +++ b/params_shard_180.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66c0387d44c64b7aab81f4205335798fc45e3bd14c9924bd7ca37d1a57cbaa58 +size 31100928 diff --git a/params_shard_181.bin b/params_shard_181.bin new file mode 100644 index 0000000000000000000000000000000000000000..edae5a78b1bbfe04fd4fa5068abded7bbb816142 --- /dev/null +++ b/params_shard_181.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2b0eee397e3498e53ffd3104b088ea41b5ce2d72b8a1c3034ea47a7d1009c10 +size 93978624 diff --git a/params_shard_182.bin b/params_shard_182.bin new file mode 100644 index 0000000000000000000000000000000000000000..23265b90afbab51f6803658057c9f2fabff941de --- /dev/null +++ b/params_shard_182.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1303fc3b5a01b4fd3001bc5cb36efdc751f6e9b475e14d37cc20b5d7dc3b897 +size 188088320 diff --git a/params_shard_183.bin b/params_shard_183.bin new file mode 100644 index 0000000000000000000000000000000000000000..6005697dcd5b8557bed374d56a761dced321f758 --- /dev/null +++ b/params_shard_183.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a15f0917039ba335f9656e87364d06264325ab5b4de397a2f350bd1e27b76f +size 23511040 diff --git a/params_shard_184.bin b/params_shard_184.bin new file mode 100644 index 0000000000000000000000000000000000000000..7cc264e25f1367bceaf5d8307adb72704f5b235f --- /dev/null +++ b/params_shard_184.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ce55b572e1ef9b5271ae9142af0881d93c2f601134b5393a01bda6e22e7a252 +size 33587200 diff --git a/params_shard_185.bin b/params_shard_185.bin new file mode 100644 index 0000000000000000000000000000000000000000..2b5e6929525b920793ee29a375b947ea5cef9c27 --- /dev/null +++ b/params_shard_185.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eed4b964d5438acd41de3aa3d7463f57b936d475bf5d3015c8bb977afa46fc87 +size 26869760 diff --git a/params_shard_186.bin b/params_shard_186.bin new file mode 100644 index 0000000000000000000000000000000000000000..7b8fcae249be3c672ca700db20b1dd09b9b8eb55 --- /dev/null +++ b/params_shard_186.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ed68dc9d13f0c565c0dd3c7793778029788c51eea7950df99553a37f164bb2 +size 93978624 diff --git a/params_shard_187.bin b/params_shard_187.bin new file mode 100644 index 0000000000000000000000000000000000000000..4186c9edec12c2ba06dfd78ebb72b10fdf5b02a9 --- /dev/null +++ b/params_shard_187.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4f4f2049e4ea539b87a6dfac46405333ae95faaf994479c122286ab93ee21f1 +size 22712320 diff --git a/params_shard_188.bin b/params_shard_188.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef1c063f40c2842b1875826cfe84c5dd053b7eca --- /dev/null +++ b/params_shard_188.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eb8a6a15cc668f78f6ee31069a666c1a2364b9ef28efa722a8b0dfbac462e7b +size 188088320 diff --git a/params_shard_189.bin b/params_shard_189.bin new file mode 100644 index 0000000000000000000000000000000000000000..80807266588497cdb979e50c2436d1b101540923 --- /dev/null +++ b/params_shard_189.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddf8c002d16860340c0d908eb9c8f3dbc0257bcb8fe1369d1794453be2adf1c0 +size 23511040 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..b945b3ce4384c5e8face92f2488cb98ed2594247 --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a15bf0307872d889cea6e76b048a2295cd94ec870d94371815c7b2fa571807e +size 26869760 diff --git a/params_shard_190.bin b/params_shard_190.bin new file mode 100644 index 0000000000000000000000000000000000000000..55d6c8f5be28474d620b8484d84378e52fe534b5 --- /dev/null +++ b/params_shard_190.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b38942c1fdcdca0f9ad3aaade8c66113845ba16c10b8b62987530a1f974f29 +size 33587200 diff --git a/params_shard_191.bin b/params_shard_191.bin new file mode 100644 index 0000000000000000000000000000000000000000..93d1ae183867b15c094f9facea2b0b7d78af850f --- /dev/null +++ b/params_shard_191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b4319f158d890da70e0e7c7d9c91988ff3a533f3ef4a029536be8669c92e2d +size 26869760 diff --git a/params_shard_192.bin b/params_shard_192.bin new file mode 100644 index 0000000000000000000000000000000000000000..4c21316ef09061d74f994212f9bd22a98bc1d363 --- /dev/null +++ b/params_shard_192.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5e22fe249abdd963deedb78146d93380804b96c1beb2bcb662a0584c4a97fa4 +size 93978624 diff --git a/params_shard_193.bin b/params_shard_193.bin new file mode 100644 index 0000000000000000000000000000000000000000..3ef3e14de336c4da8c3b0d69d92023cf4878299f --- /dev/null +++ b/params_shard_193.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f7f47a3cfdced2ebc98d3089b606bcf57fdcec722cd5c51fffb4d61e2caad5d +size 188088320 diff --git a/params_shard_194.bin b/params_shard_194.bin new file mode 100644 index 0000000000000000000000000000000000000000..a9e4b20706a61df77e17e13520c8e1a876971766 --- /dev/null +++ b/params_shard_194.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3703eb563f8a8af259e5dcaef34b784b125349e934296616e4b440d528026d5 +size 23511040 diff --git a/params_shard_195.bin b/params_shard_195.bin new file mode 100644 index 0000000000000000000000000000000000000000..5246d144a1a54731def4724e5ed58c20502b9cc8 --- /dev/null +++ b/params_shard_195.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd40157db1ceed8376bbb94c915e13fbf8c7eaea5a2859fbd6ecea05d612949d +size 33587200 diff --git a/params_shard_196.bin b/params_shard_196.bin new file mode 100644 index 0000000000000000000000000000000000000000..910b1bcecda0b3087d51dbd9692d565c78576ab4 --- /dev/null +++ b/params_shard_196.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cfc768e8f4a80f9903dccc70d697ce71817c6cc6730ee77068e4f782eca5828 +size 31100928 diff --git a/params_shard_197.bin b/params_shard_197.bin new file mode 100644 index 0000000000000000000000000000000000000000..7dd8a3214312f74bcbcff03777dfe832ab6501bf --- /dev/null +++ b/params_shard_197.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cf3c857cba0a179886fab12e391fb62de9fa36340d7ccd3a2234b6a820ba125 +size 31068160 diff --git a/params_shard_198.bin b/params_shard_198.bin new file mode 100644 index 0000000000000000000000000000000000000000..f4f3b2c1cae6f8bd4cb7427f0001b2ae1f31bd21 --- /dev/null +++ b/params_shard_198.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f47f33197edf5f464b6b2c6e87e9bdab207f274ce628874e7c0389a3c5b36225 +size 188088320 diff --git a/params_shard_199.bin b/params_shard_199.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c695d4e5f5528807a7771a20cc9fe44d9bfeeee --- /dev/null +++ b/params_shard_199.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde17adedaf05d53e6f191c1a63cde609ec2cc3787b5ca5617823594c939da19 +size 33587200 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b894ed57b6246b45827e6bddc9f3912c9eb84fc --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de3572d230ef0254dc9388e6411039a80a2c65d07f1cfbb18b7d0a4398be10b9 +size 420679680 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..b648f0132846bfe5091017124a9b38276a952bf8 --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ddd3445634c366c3b783522c5dc86495fd722350328358086712ab33bf3dde7 +size 93978624 diff --git a/params_shard_200.bin b/params_shard_200.bin new file mode 100644 index 0000000000000000000000000000000000000000..2e0f8126324abd7c21fe1b92d31e782bc53843e5 --- /dev/null +++ b/params_shard_200.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3abbea1100fb36238ca075d449ea6fe1da317373bd4f0b7fe043ed1b361f611d +size 26869760 diff --git a/params_shard_201.bin b/params_shard_201.bin new file mode 100644 index 0000000000000000000000000000000000000000..a5efb6e39c51838487ec316ccd4dfe2820c8acfe --- /dev/null +++ b/params_shard_201.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec35a338a45d68d91c493e7e4abaae785db755adcc69db63b3a2cbbab6d1e1b5 +size 31068160 diff --git a/params_shard_202.bin b/params_shard_202.bin new file mode 100644 index 0000000000000000000000000000000000000000..29c15051dde616e2f72bf579eb4d7be417e4d6bc --- /dev/null +++ b/params_shard_202.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f49e286bda6d1e902cd893074175479752bd841d5929390a2e54950333b45d11 +size 93978624 diff --git a/params_shard_203.bin b/params_shard_203.bin new file mode 100644 index 0000000000000000000000000000000000000000..a425be916bc4bff0c14e2e880e90f84efdaf7e3b --- /dev/null +++ b/params_shard_203.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b02b23741d413ec89ba602a9e552887fc5b02e0f08f3d2e55ddb9a2df44580f +size 188088320 diff --git a/params_shard_204.bin b/params_shard_204.bin new file mode 100644 index 0000000000000000000000000000000000000000..a4620f5a479d952aa01760df97a265947660f583 --- /dev/null +++ b/params_shard_204.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c96f96e8dd0bde2e4494d35fc2f3ef6b2767a21671d04408dceb653cafdaabd +size 23511040 diff --git a/params_shard_205.bin b/params_shard_205.bin new file mode 100644 index 0000000000000000000000000000000000000000..e5f5398d81dfce3b6a1a31a0af24a5a521dfe701 --- /dev/null +++ b/params_shard_205.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0f028faa8cd85138493aaa9d93d814848f8527b7f7be5a3e746c6e676dec223 +size 93978624 diff --git a/params_shard_206.bin b/params_shard_206.bin new file mode 100644 index 0000000000000000000000000000000000000000..1b22fedf3fbfa8ab690cd349afe66eacd2b68cc4 --- /dev/null +++ b/params_shard_206.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73fe14e7ec6cbe28373d01421749cd20c77cd497f0765cb67e626800c10c2dd1 +size 188088320 diff --git a/params_shard_207.bin b/params_shard_207.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1b1ee6e933fc6769bd80982a8a72652bca9e805 --- /dev/null +++ b/params_shard_207.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:065b9d30becc3b596bfa921cd5a6c994dd65735fb05c3274754811883d536fd5 +size 23511040 diff --git a/params_shard_208.bin b/params_shard_208.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d60e7839e0de2184c80e2fc01c8c939d7e160e6 --- /dev/null +++ b/params_shard_208.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e81425e30337c67fab5814bcf88dd9a676f4dd31f5852deda19b14e4e7b5bf +size 33587200 diff --git a/params_shard_209.bin b/params_shard_209.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef5ba6b83394e8ddc5fe0d1646a576fd3406e4e9 --- /dev/null +++ b/params_shard_209.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:062620d18c09525b6b89e934b9c030f3ab30b8e525110752566d3e00dda9d060 +size 26869760 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..7631f78bce93839570029f59b752b6a61b989e97 --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8697b38b1b73e932194205dd150ab470c63ce14fe279f2e6f713487bfcc213 +size 31117312 diff --git a/params_shard_210.bin b/params_shard_210.bin new file mode 100644 index 0000000000000000000000000000000000000000..f1560f10019a521038ab03159ef067b2c2a5c3bb --- /dev/null +++ b/params_shard_210.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a71f405242db8354f4db10609df3188c17cbe79e3ef2e8298fc223c459caa102 +size 31117312 diff --git a/params_shard_211.bin b/params_shard_211.bin new file mode 100644 index 0000000000000000000000000000000000000000..9795e01b75ed1b91a741a9a4b430aaa4072f5b46 --- /dev/null +++ b/params_shard_211.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d4761d6426df0df799284ec365535875285d58de23d556be3c5f12e4c97f8a9 +size 93978624 diff --git a/params_shard_212.bin b/params_shard_212.bin new file mode 100644 index 0000000000000000000000000000000000000000..faf6753a2d83709bbf003aa71d7ef8bfd8e1cbcd --- /dev/null +++ b/params_shard_212.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:800114d04bc81567673bd97106507971a8391d48af23a277711a9688c2a0a24f +size 188088320 diff --git a/params_shard_213.bin b/params_shard_213.bin new file mode 100644 index 0000000000000000000000000000000000000000..252460f9fe07517022d5b1e6d678e93f27bc8581 --- /dev/null +++ b/params_shard_213.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e0af34dae6b6d8bad037c0cf7b45767a7700a87404800ca258720c3db32fcf +size 23511040 diff --git a/params_shard_214.bin b/params_shard_214.bin new file mode 100644 index 0000000000000000000000000000000000000000..53bbe06ddeafe0705d3520123f5044cd5224e4cf --- /dev/null +++ b/params_shard_214.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f09389ae1bc3803e692b5d4271d43d9e95c224f235cca1b5270138fc99982ce +size 33587200 diff --git a/params_shard_215.bin b/params_shard_215.bin new file mode 100644 index 0000000000000000000000000000000000000000..9fc45b0ef9b964d38a685ec4112a8e5fd0a0fec5 --- /dev/null +++ b/params_shard_215.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2047f2fcb300293ecf4baac7e361fda74e34fa32d5e6ef45435aa9c8b3db6b3c +size 26869760 diff --git a/params_shard_216.bin b/params_shard_216.bin new file mode 100644 index 0000000000000000000000000000000000000000..9f87de5cf2007076bf0e20beab8663331145a443 --- /dev/null +++ b/params_shard_216.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1a8e8a90275c912bc0d5f0022e0cbde4a147350fda25564db140742b0061e65 +size 33587200 diff --git a/params_shard_217.bin b/params_shard_217.bin new file mode 100644 index 0000000000000000000000000000000000000000..32d76709fe291794db7dfd9bbd97437320de7237 --- /dev/null +++ b/params_shard_217.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:151aaf16fc3022df7cd335b88a3952a44d1d974dc6b582971093a4955c9368c4 +size 93978624 diff --git a/params_shard_218.bin b/params_shard_218.bin new file mode 100644 index 0000000000000000000000000000000000000000..74455b454b4747d498f923c23c59c69e03ab1fc7 --- /dev/null +++ b/params_shard_218.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dec3c7a3456a50b768cedf568ea7bd5c54bf1c7e5486531bf9ef584d36b98571 +size 26910720 diff --git a/params_shard_219.bin b/params_shard_219.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab5cd52732ac2aaf649c8abd9fa53c82016f09bf --- /dev/null +++ b/params_shard_219.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0575764e2ce991a9d78581bec64c3f823e1c4aade9c55d76ecee260533f5f2f7 +size 93978624 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..249df969157d85ebc8e22d4b9628fc9082de880e --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee70b10f87ceee173676ee3222941e9908f5af7908f90ce4b6a7565bfa2e3df9 +size 188088320 diff --git a/params_shard_220.bin b/params_shard_220.bin new file mode 100644 index 0000000000000000000000000000000000000000..34b2f888489e0447aace9095e58d7eeffb9cd6d1 --- /dev/null +++ b/params_shard_220.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:777530e4425447e71c4e995cfa3a4c1e735779dc30778fe84c0b70a951aeba56 +size 188088320 diff --git a/params_shard_221.bin b/params_shard_221.bin new file mode 100644 index 0000000000000000000000000000000000000000..39afd5870421936c437b45427c4df8041fb0068b --- /dev/null +++ b/params_shard_221.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8bc0fabe177f552d51569fe4f5cab38dbe5a9db3fedf464a6169d89399f5bb6 +size 23511040 diff --git a/params_shard_222.bin b/params_shard_222.bin new file mode 100644 index 0000000000000000000000000000000000000000..2bfff93a80366eca007df21cbd801ac15828e475 --- /dev/null +++ b/params_shard_222.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2af3c2d47ef0e91588504bdcdc47a4b7d7accee32a70094f83f6888821874926 +size 33587200 diff --git a/params_shard_223.bin b/params_shard_223.bin new file mode 100644 index 0000000000000000000000000000000000000000..913528d73304a66f4dc9846dd4853d3ae15d4f2c --- /dev/null +++ b/params_shard_223.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b1aae2d48bbd8e12bcdccf79b14ef2bee40d35ce5ac26f07ff18a10ed9675e9 +size 26869760 diff --git a/params_shard_224.bin b/params_shard_224.bin new file mode 100644 index 0000000000000000000000000000000000000000..d027c19fa99102e6fd02c6f1b00b0be42560eb6b --- /dev/null +++ b/params_shard_224.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e4e44855a4fac54b873dbd730610674d6e07ad87aa8c8237e4610a0c181e84e +size 93978624 diff --git a/params_shard_225.bin b/params_shard_225.bin new file mode 100644 index 0000000000000000000000000000000000000000..f54044dc2d364e59df62ac326686d7c01d98458f --- /dev/null +++ b/params_shard_225.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b24daa545de0f066d209e40c0f7729d57cab0d7777e98e5d85845095d337635 +size 31117312 diff --git a/params_shard_226.bin b/params_shard_226.bin new file mode 100644 index 0000000000000000000000000000000000000000..997efc224502608615cee8850341cfaf4273c8ba --- /dev/null +++ b/params_shard_226.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3187edccc0440d0140e3264090d5d257e68fcffbae78367c637a26df0218e50c +size 188088320 diff --git a/params_shard_227.bin b/params_shard_227.bin new file mode 100644 index 0000000000000000000000000000000000000000..a3347d6f85267939f203ba7111d2ff2204870502 --- /dev/null +++ b/params_shard_227.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9db7729cf392b845860d1ccbe040ca562f13f86cb82247afad6498a8949a84f0 +size 23511040 diff --git a/params_shard_228.bin b/params_shard_228.bin new file mode 100644 index 0000000000000000000000000000000000000000..10d79d2c990dff74b0b19b431b5b2f1cf51b40fe --- /dev/null +++ b/params_shard_228.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c78d1bfc3542f5974c97c443c633c44d7275f86fb45ccf9030781a5396a57519 +size 33587200 diff --git a/params_shard_229.bin b/params_shard_229.bin new file mode 100644 index 0000000000000000000000000000000000000000..b691505f9c1739c4359e5a5adbd5fabfb7397dff --- /dev/null +++ b/params_shard_229.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e89bb3c94c5e09b90ac79d868e70d9ec550cf44e4ef053cd03c998ca7f9f65c +size 26869760 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..52dfdceaaf57751937ae21eb2449aaae3b3a323b --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f79099b1bbc5a895a275d12c546a144f4b6b963898599f24b49b4ea9fd52b883 +size 23511040 diff --git a/params_shard_230.bin b/params_shard_230.bin new file mode 100644 index 0000000000000000000000000000000000000000..843bbb9ed5b3418370706a1629a841b1a9ea3b23 --- /dev/null +++ b/params_shard_230.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38d8a8409f22d85cb135209bcffc287605851754741ef10514a8b7c0c52b3552 +size 188088320 diff --git a/params_shard_231.bin b/params_shard_231.bin new file mode 100644 index 0000000000000000000000000000000000000000..7c1d9ad8cdcab9affa6a4d971c1475e4c0fbd9b8 --- /dev/null +++ b/params_shard_231.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376480aa46fd16545d91cefb2a6a1b568307bfa707894687f841201cbad564ab +size 23511040 diff --git a/params_shard_232.bin b/params_shard_232.bin new file mode 100644 index 0000000000000000000000000000000000000000..ebce6014d31551c95d43bb263ea1d0e3d830312a --- /dev/null +++ b/params_shard_232.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5e95f179bff7a3caa904ebb084e3bdfa3c74a173d55d7483a88035e9665954a +size 33587200 diff --git a/params_shard_233.bin b/params_shard_233.bin new file mode 100644 index 0000000000000000000000000000000000000000..af8770480a83503bffa4c9c50984f996b00408d4 --- /dev/null +++ b/params_shard_233.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed81f85a6e0abeab850abab42514f6cc348ba4502ee19405f17a8ce3d0dbf438 +size 26869760 diff --git a/params_shard_234.bin b/params_shard_234.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee8d6cf937d5d59f237c1945ea5012e0c518d993 --- /dev/null +++ b/params_shard_234.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169fb94600351881c6746f2b760eec78d7be9830d4962e8587fd9eb1617a34b3 +size 93978624 diff --git a/params_shard_235.bin b/params_shard_235.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e11cc6529a1f5a0c59878df222b2b1e239ced00 --- /dev/null +++ b/params_shard_235.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa18217f2d02b4b2ba9580bcc89d0769452c3a6e74f3d899d9ec0d1a1f3d8669 +size 26894336 diff --git a/params_shard_236.bin b/params_shard_236.bin new file mode 100644 index 0000000000000000000000000000000000000000..846991614aac844d634e2c657e15242c142aff03 --- /dev/null +++ b/params_shard_236.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d6fc8c82223641e268333c7a99dfc961f051255d0f91ad3d835c91f5361c254 +size 93978624 diff --git a/params_shard_237.bin b/params_shard_237.bin new file mode 100644 index 0000000000000000000000000000000000000000..f43628b268204d4026578a7b7811b293d86c4552 --- /dev/null +++ b/params_shard_237.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3404ea49b4d36c334e12d3cbd30ec14782aecbd1ad3434adbd88f109deeb2336 +size 188088320 diff --git a/params_shard_238.bin b/params_shard_238.bin new file mode 100644 index 0000000000000000000000000000000000000000..ac048443051aa53b9746ca307a773226c3a450f7 --- /dev/null +++ b/params_shard_238.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a8f3b81d5973e6eb7d26d343bbb7b4e92e07bee6d41812562a0eb1f79a5ff1 +size 23511040 diff --git a/params_shard_239.bin b/params_shard_239.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab382d3a0fdd99839099d31a2302c7cf57bf79ea --- /dev/null +++ b/params_shard_239.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b148378837cc41596d9e630f74764536b4ebc9303f8a5cf8537739f117d72891 +size 33587200 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..5cd123329f2d03db43b4ce1e6e59ae82aa01f139 --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea45dd48638a24c385037288e0ccf34e4f00192a4627d326953b762d112d888 +size 33587200 diff --git a/params_shard_240.bin b/params_shard_240.bin new file mode 100644 index 0000000000000000000000000000000000000000..62a7a77e287b8ed00eedaac9c10a973bee9c2758 --- /dev/null +++ b/params_shard_240.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a52313065003276bdf3134efb337aee33449ce3f129d970f3964a54e378b064 +size 26869760 diff --git a/params_shard_241.bin b/params_shard_241.bin new file mode 100644 index 0000000000000000000000000000000000000000..92ad369b6d57ed658112d6f150effaa18df28117 --- /dev/null +++ b/params_shard_241.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccbbb5918a44f1175238fbc9122efbb0b5955f4ff04d12c50beb5cd15fb4bab4 +size 93978624 diff --git a/params_shard_242.bin b/params_shard_242.bin new file mode 100644 index 0000000000000000000000000000000000000000..b4deb0284d3ced4d2a3dd7069890ba209adfb995 --- /dev/null +++ b/params_shard_242.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89722975736e810e8e2ac74319bbd9454713abe460abdb8b6d33beaaa6b20137 +size 31117312 diff --git a/params_shard_243.bin b/params_shard_243.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb96dfa301124fd7c60e021def2332d674b87357 --- /dev/null +++ b/params_shard_243.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b39f829edcc1a50454b302eaf36b28a9fa6e53773a805c4aab06be55524a61e8 +size 188088320 diff --git a/params_shard_244.bin b/params_shard_244.bin new file mode 100644 index 0000000000000000000000000000000000000000..97e0ccb6600a4428be478bcccc32ca3e6f7c00b6 --- /dev/null +++ b/params_shard_244.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa491c0c9db1d5f4ba1bfc142b7dac7a79365363eab91ddee2b0988c5d1bcba3 +size 23511040 diff --git a/params_shard_245.bin b/params_shard_245.bin new file mode 100644 index 0000000000000000000000000000000000000000..66eaf88cb892614a543f213d12b5ad2d9df5b8e6 --- /dev/null +++ b/params_shard_245.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7dd50a38c559b37060ac644cbee7588d750bcf0469c0a24025516f264e485d2 +size 33587200 diff --git a/params_shard_246.bin b/params_shard_246.bin new file mode 100644 index 0000000000000000000000000000000000000000..11c32b8bdfe95138717d08926288ca06e443aeb7 --- /dev/null +++ b/params_shard_246.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44679cf8fb411cc9a4b37aca21166974f347ec61c484c8b63201056563d79143 +size 26869760 diff --git a/params_shard_247.bin b/params_shard_247.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d6a5928b44d81550eabc1970aef404102e616b8 --- /dev/null +++ b/params_shard_247.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c93b12aba512791f45da867ca1eb7a737b5f8ea46a33b08eb94073dfbd9e742 +size 33587200 diff --git a/params_shard_248.bin b/params_shard_248.bin new file mode 100644 index 0000000000000000000000000000000000000000..67c2f764f5b5fb807af7b12aa9dcbee27bc1abb2 --- /dev/null +++ b/params_shard_248.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34425f037dc9979fdcb3edee4ce40b8a8da2574bf65429a2f542fa9af459dc63 +size 26869760 diff --git a/params_shard_249.bin b/params_shard_249.bin new file mode 100644 index 0000000000000000000000000000000000000000..7bda5dbc5b89617b56978ef1d29d31e6f862a3a8 --- /dev/null +++ b/params_shard_249.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:405459356d762ebecfe079dfb661c2c265af79517f5471d43ab2c11315cfbda2 +size 93978624 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..24c88265703c38097ba89c5a0748637fee515382 --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ab2b1edb5c3d8eaf53d5cd7c660ea7b63472239c5f41c7d6d1f8a861fdb4b2 +size 26869760 diff --git a/params_shard_250.bin b/params_shard_250.bin new file mode 100644 index 0000000000000000000000000000000000000000..c5dc49d8d8552487f82ffa742f3e0d7911f61d8c --- /dev/null +++ b/params_shard_250.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3c3774b3a9c13f9cc4672ad9f604a848314a76d1f3d7b5df21b8d91009af5c4 +size 26894336 diff --git a/params_shard_251.bin b/params_shard_251.bin new file mode 100644 index 0000000000000000000000000000000000000000..9cab5d01c4dfc06979e6e4bf2c5dd316ebd32b2c --- /dev/null +++ b/params_shard_251.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26fd17445448da9082aa39e0bbb1f37a5b5363fb0dbfa465378963e0e334bba7 +size 188088320 diff --git a/params_shard_252.bin b/params_shard_252.bin new file mode 100644 index 0000000000000000000000000000000000000000..782e0f8acff300cdf4402b8fe601501e9a339ac7 --- /dev/null +++ b/params_shard_252.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e10caaccdb5ed8d18b007febbd9ae52c08703a065566f7f7123b5d70fd369eeb +size 23511040 diff --git a/params_shard_253.bin b/params_shard_253.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e210087b323d390674261fa896a778021827134 --- /dev/null +++ b/params_shard_253.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4d704e6636c6b9a05ba12a1772e99519658ec41f3db5f3bdc80b2e7ddb1374b +size 93978624 diff --git a/params_shard_254.bin b/params_shard_254.bin new file mode 100644 index 0000000000000000000000000000000000000000..0744e5d89efe0707d4127b0135f7e2e5605c79c0 --- /dev/null +++ b/params_shard_254.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fda957ad1a9896484ebb31e7523ba1fe75f59be6ba8c91b066224fc7df177b1 +size 188088320 diff --git a/params_shard_255.bin b/params_shard_255.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e36f409f3c0f6e15002462c8f8f5b5b31aa16fa --- /dev/null +++ b/params_shard_255.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2da5b94b1d0d1aeb2121cb117b45cbaab0b34a19d983a1a6fcf22f5189de9e3 +size 23511040 diff --git a/params_shard_256.bin b/params_shard_256.bin new file mode 100644 index 0000000000000000000000000000000000000000..4df8810dac24500958dec9ca45f311891ea87548 --- /dev/null +++ b/params_shard_256.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:796925b9a03928ba76cd7905fcb60dba26838b17a5091d0b6c017ce52f356857 +size 33587200 diff --git a/params_shard_257.bin b/params_shard_257.bin new file mode 100644 index 0000000000000000000000000000000000000000..d1fdb97c9f71ff6e621c9908dcaedf41e8150947 --- /dev/null +++ b/params_shard_257.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f156737da67bfa1a1c50634167ef3a07ec3d03af6b9915961fdbc34e6153c74a +size 26869760 diff --git a/params_shard_258.bin b/params_shard_258.bin new file mode 100644 index 0000000000000000000000000000000000000000..8ec69a6d2acc76d2223024da75afb557a2fb479d --- /dev/null +++ b/params_shard_258.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41b5ab55733876a877539008a01b9dfe47fd618aa7593f999c3db24289e313da +size 93978624 diff --git a/params_shard_259.bin b/params_shard_259.bin new file mode 100644 index 0000000000000000000000000000000000000000..e65a294177deed770ae31f091eafd896f293eab5 --- /dev/null +++ b/params_shard_259.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e69ffc01cde15d450998591808738d5c1d4fea95f3362387ea7ce8f8fb09dff +size 31117312 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..da44183b9e09b2b6a0f9665d638a957ee2325932 --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b58d13014d389cb59581cd70ee08a9884acc9b0f4936dcb97a6d73e92199389b +size 33587200 diff --git a/params_shard_260.bin b/params_shard_260.bin new file mode 100644 index 0000000000000000000000000000000000000000..6114a5afa6d7b9418e8984dec6afc7c941e8b1eb --- /dev/null +++ b/params_shard_260.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97e1991f9f73b87333c05994349603ce1a03df4b41a147bf2240af816ef3061c +size 188088320 diff --git a/params_shard_261.bin b/params_shard_261.bin new file mode 100644 index 0000000000000000000000000000000000000000..3f44031f1cae1451cd4a0d8bfcf13b599e52efdc --- /dev/null +++ b/params_shard_261.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57efb78294a7729e57e501838c06533470f78ed03a7f191def9d941f3ca80f13 +size 23511040 diff --git a/params_shard_262.bin b/params_shard_262.bin new file mode 100644 index 0000000000000000000000000000000000000000..137ad6ee9dafb2335a8784cecbf1abb026903b79 --- /dev/null +++ b/params_shard_262.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e6ab645063705e8b2ab1e100196b78c1cb5e4af2db0fed136bd5f3615056532 +size 33587200 diff --git a/params_shard_263.bin b/params_shard_263.bin new file mode 100644 index 0000000000000000000000000000000000000000..55d937820f081dd35035b57f1cf6d30433774754 --- /dev/null +++ b/params_shard_263.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:133dd6f48df0ba9394e571bf175ed0625230cf8abe26c7b63b5a61c2a3df0e3b +size 26869760 diff --git a/params_shard_264.bin b/params_shard_264.bin new file mode 100644 index 0000000000000000000000000000000000000000..78222ebe4e2be0363f4d354e09c6cdafb3ee10fe --- /dev/null +++ b/params_shard_264.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b661e1a565ee968e35ea1f7507f505d72ea393a143729edccef9dda6210bb90 +size 33587200 diff --git a/params_shard_265.bin b/params_shard_265.bin new file mode 100644 index 0000000000000000000000000000000000000000..cbef39a308d72a7b54dd803b91fc3bfdff8350a5 --- /dev/null +++ b/params_shard_265.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4c4be6c93912586ef89ff9fcca656750fb497a8289f8681886a96a87f5fcaf +size 93978624 diff --git a/params_shard_266.bin b/params_shard_266.bin new file mode 100644 index 0000000000000000000000000000000000000000..b4cb81433f250f1aec21e60bc2f7c5eee7b91650 --- /dev/null +++ b/params_shard_266.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e770d7a523256f56833458f5331a8fadb3dee571ca7a891db3f839d207d94490 +size 23535616 diff --git a/params_shard_267.bin b/params_shard_267.bin new file mode 100644 index 0000000000000000000000000000000000000000..5742529686cb8853f8bb9a81bf65b8298a8bb1fe --- /dev/null +++ b/params_shard_267.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f38a99f481f1ba30d4a38f221358d39cca1b3f465064894aa97ada27c36de5ef +size 188088320 diff --git a/params_shard_268.bin b/params_shard_268.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a2474531966fd4c08c468772b839457127e0f21 --- /dev/null +++ b/params_shard_268.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fe48caf80428e02d5227d489888dcd4e166584e0a91bd375ee2498ebdec4f7f +size 23511040 diff --git a/params_shard_269.bin b/params_shard_269.bin new file mode 100644 index 0000000000000000000000000000000000000000..236704dbdad735723a3b525a6219c5f523a1bac2 --- /dev/null +++ b/params_shard_269.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccacbc986f5adef02f58ca193300e5a25e809f84e16dbc78c84d8a8acbf1039f +size 26869760 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..d1a5b6623e63748854d993dbc87f19785f6aec4d --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2805f1564735f6f999b9981c65fe779d21ba5cc182fa9859866becceba51550d +size 26869760 diff --git a/params_shard_270.bin b/params_shard_270.bin new file mode 100644 index 0000000000000000000000000000000000000000..3bfb8bf2e837c94831164ef87b1081a864a98ed5 --- /dev/null +++ b/params_shard_270.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a15a58562334255a836966a6f4fbf524b5bd9b3efd55215336cf3c8d88d5d3c +size 93978624 diff --git a/params_shard_271.bin b/params_shard_271.bin new file mode 100644 index 0000000000000000000000000000000000000000..5576ca7621203b2fe172e722860cfd8098738155 --- /dev/null +++ b/params_shard_271.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a509ba2c9ceda9f087a2af68cce52ae7d6b78d909b0e4ef657dd4c6f4ede4b72 +size 188088320 diff --git a/params_shard_272.bin b/params_shard_272.bin new file mode 100644 index 0000000000000000000000000000000000000000..79633800554a26a5a35a6496d639448dd18854fc --- /dev/null +++ b/params_shard_272.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c8e3358da64df689d97d07fdff69f3c5ea26c88ca239b9042352abf2b160bf2 +size 23511040 diff --git a/params_shard_273.bin b/params_shard_273.bin new file mode 100644 index 0000000000000000000000000000000000000000..52a99db73144a491a3e0c3d07cc0fe394a82d394 --- /dev/null +++ b/params_shard_273.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fc00d3bce6adf5cc52440331e090de7c0b1b954e2c996d98386332872ca47b6 +size 33587200 diff --git a/params_shard_274.bin b/params_shard_274.bin new file mode 100644 index 0000000000000000000000000000000000000000..a150204decceef9cf8668a54658d970e26a5e92d --- /dev/null +++ b/params_shard_274.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:411f187a6d04fdd1de23841d8aa1ba98459bf804c6d27eb82274a7e48761bd1f +size 26869760 diff --git a/params_shard_275.bin b/params_shard_275.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1ac229e9b9742b15620341406069463ba9601fd --- /dev/null +++ b/params_shard_275.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee445781aa80e8dc0bc8a9628510422cc91349aa81651781fd88a0a747f56ed3 +size 31100928 diff --git a/params_shard_276.bin b/params_shard_276.bin new file mode 100644 index 0000000000000000000000000000000000000000..7508b3fd13abb3356aa0a657bb5e0882867ccf89 --- /dev/null +++ b/params_shard_276.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31aa8ca46c1d30948b672bda371bfc9189d1f0dfedf1a035170fae021f1294a7 +size 93978624 diff --git a/params_shard_277.bin b/params_shard_277.bin new file mode 100644 index 0000000000000000000000000000000000000000..a4432a5af4aba6ab868b9bb1ba053327189c1e43 --- /dev/null +++ b/params_shard_277.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19d62f6480f2c03334c686dfda70de24de4a995d0269fab285ba53dce4a59549 +size 188088320 diff --git a/params_shard_278.bin b/params_shard_278.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb67449b44845a3eb7195ea9cadce7280a44adaf --- /dev/null +++ b/params_shard_278.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b423180915926ce60a13365421935f60e20123a963e67b7abcb7dc1ecc5f5d +size 23511040 diff --git a/params_shard_279.bin b/params_shard_279.bin new file mode 100644 index 0000000000000000000000000000000000000000..67382b3ce65e9d539f9bda1b1bc929fc6916c1d8 --- /dev/null +++ b/params_shard_279.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08f57fb0f0e829a8b5769a9ac6371b969214487dfadf481ff535299add1359f1 +size 33587200 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..3dcb7fe70ab778c361b493796d47fedaaa90e0f8 --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0a1e3c8c9439900b32ae8fae082e36637f64b34f4e20e2c02f9dac8da959c97 +size 93978624 diff --git a/params_shard_280.bin b/params_shard_280.bin new file mode 100644 index 0000000000000000000000000000000000000000..b9e9b0b5ae396fda196cdf162322307451943afd --- /dev/null +++ b/params_shard_280.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d22e8b33a3361b14cee013258e033fd7230b6956a8577ca45759f42967e389cd +size 26869760 diff --git a/params_shard_281.bin b/params_shard_281.bin new file mode 100644 index 0000000000000000000000000000000000000000..747a727927df1f739cef293ddf1343c4de9f7f24 --- /dev/null +++ b/params_shard_281.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96debf4ce4a5b680a5800b9dd47e3c7b2a12ec295c484656ab075d8c89a2536b +size 93978624 diff --git a/params_shard_282.bin b/params_shard_282.bin new file mode 100644 index 0000000000000000000000000000000000000000..81d4aebc89cd0b021bcc730a03709db26a2f86aa --- /dev/null +++ b/params_shard_282.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea67e98558601bf97e210bf62cfb000d86dbfce0d995e12229916e8b21a2e909 +size 22712320 diff --git a/params_shard_283.bin b/params_shard_283.bin new file mode 100644 index 0000000000000000000000000000000000000000..56591f97652164502353d5d405ca19713dfa786f --- /dev/null +++ b/params_shard_283.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4317a982b9d51f31692331d987ffa1deacc33a973b6755309c3cb1d089fa7743 +size 188088320 diff --git a/params_shard_284.bin b/params_shard_284.bin new file mode 100644 index 0000000000000000000000000000000000000000..e33830d00d1964f3ce91fb2b3352bfac9ad60448 --- /dev/null +++ b/params_shard_284.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ab9d33f1b9c60160d194d3671c78f7bd8de2b5c938ab45f8a5fe5d92a91fd7 +size 23511040 diff --git a/params_shard_285.bin b/params_shard_285.bin new file mode 100644 index 0000000000000000000000000000000000000000..386dce84dfb08cebb745c6da4a49debc90d617e4 --- /dev/null +++ b/params_shard_285.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6635189f725e3efe782db882d8542c872dc18f3c868b0a5bd44cb1a7be09bfef +size 33587200 diff --git a/params_shard_286.bin b/params_shard_286.bin new file mode 100644 index 0000000000000000000000000000000000000000..46d2afd7a1ef794a42ac823148c224584b153db0 --- /dev/null +++ b/params_shard_286.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c011b11962a3d74121c725632195a93e32486220ed7be2b553f6fff19aa34c7 +size 26869760 diff --git a/params_shard_287.bin b/params_shard_287.bin new file mode 100644 index 0000000000000000000000000000000000000000..c2e6f1487f3770e3482faa385dbe087cf836a4f7 --- /dev/null +++ b/params_shard_287.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb53d637f22876821429d161474be4dea937313beb416dbe56d3e6a93d826c1 +size 93978624 diff --git a/params_shard_288.bin b/params_shard_288.bin new file mode 100644 index 0000000000000000000000000000000000000000..dac55fce053883f397370476d62519d8535a1708 --- /dev/null +++ b/params_shard_288.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77994f12f4d57556c263adc0a1f790a93f555e6509824805e5756aa7ef4f8de4 +size 188088320 diff --git a/params_shard_289.bin b/params_shard_289.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea5b825c4ead837e2d4551cd32fe167190f9fa4e --- /dev/null +++ b/params_shard_289.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:455667931152cd64efacb196a76d21b5a08f10bee9dedf2789efd97bd21b7867 +size 23511040 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..e4d5e6966066c141f68a341d63f30d51d332b06b --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e8ab6d94988d8cbc2877b2894b72b3be1c21ef1323366b44a14447bf7ef35a +size 26894336 diff --git a/params_shard_290.bin b/params_shard_290.bin new file mode 100644 index 0000000000000000000000000000000000000000..342dff3b0273d0feebb907c9b2995cbfec0e2d77 --- /dev/null +++ b/params_shard_290.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a23632eaf6556af26123a3bec05033be74bc6ab4761cb612085b01a56b2cd6e +size 33587200 diff --git a/params_shard_291.bin b/params_shard_291.bin new file mode 100644 index 0000000000000000000000000000000000000000..1fc6ae2310677514fd2f96509aa3e3f7e333c4af --- /dev/null +++ b/params_shard_291.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:102ed4e3375041abaa0793935e764ea3d91282f90732e1998bb39d6bf9d93645 +size 31100928 diff --git a/params_shard_292.bin b/params_shard_292.bin new file mode 100644 index 0000000000000000000000000000000000000000..417ee2bd74413c5d5210077ba374d9f0e074b8fd --- /dev/null +++ b/params_shard_292.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ec4b49a7d29397fafe5bb1e79669497e2ac4bc4022f0e078e982229b180c1f +size 31068160 diff --git a/params_shard_293.bin b/params_shard_293.bin new file mode 100644 index 0000000000000000000000000000000000000000..909ab2f236ee7bf13d9058c48b07e9016ad5d238 --- /dev/null +++ b/params_shard_293.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46bb6ddba2eb13e7ddd9c9ade86190d32757ae48f2b1e507dd6067e15f75a106 +size 188088320 diff --git a/params_shard_294.bin b/params_shard_294.bin new file mode 100644 index 0000000000000000000000000000000000000000..cd89ccb555ae6d1f701de2f2bfd46c13b4e6dd54 --- /dev/null +++ b/params_shard_294.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e0ea87d7febf601c6e8ac78ffec9ffc0f0ca18169e2e5b7f7fcb27b3c8a7d21 +size 33587200 diff --git a/params_shard_295.bin b/params_shard_295.bin new file mode 100644 index 0000000000000000000000000000000000000000..81dd4ec65e2c43476017d4b793b07c061ce9fb09 --- /dev/null +++ b/params_shard_295.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef407a9a2d884006b4d622a56d63c2fb5454927eff0e0664ca79f07558197af +size 26869760 diff --git a/params_shard_296.bin b/params_shard_296.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2cb54839193feedbdadc262af974d4333f8e3a4 --- /dev/null +++ b/params_shard_296.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eacca7f30ef60f5a82a2fcbbcc6339fcf39c6022a166300a8d939a55a1c57fb9 +size 31068160 diff --git a/params_shard_297.bin b/params_shard_297.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc5558aa6a0a9e3420d57a406dfbc3d1c3da4f7e --- /dev/null +++ b/params_shard_297.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9d239cbef24f222a976a81e02c1d8b8a970f96648c48f96b971c0de557f02f +size 93978624 diff --git a/params_shard_298.bin b/params_shard_298.bin new file mode 100644 index 0000000000000000000000000000000000000000..4eabea4afd8ecb28960fa029c1c770f1ff9b3363 --- /dev/null +++ b/params_shard_298.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b6cfb8de52fa7d65756f0145b67b94baa16f5ef232f6842c000bf4f0fe9c00 +size 93978624 diff --git a/params_shard_299.bin b/params_shard_299.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc7af85a4dc8a8d1867f345cca0329451f9148e4 --- /dev/null +++ b/params_shard_299.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c47e83e5362059ad66c5ec6bc05349f4cfb89cc8ae115859d692be9e3403c4 +size 188088320 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..c0d0c40177852cd3da8323c990a0ebfa6663d301 --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af45dafe25475a44cdf20e315d89640ed50ed292184737007200bfccc4a6365b +size 52584960 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..d9cf00cb02403b0a12be1db263c7a088dba6b8b8 --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a17dc58b7e7339f6b62166cbd89ba7bc28a910c343d7b2ab5133548ea9b31f9c +size 188088320 diff --git a/params_shard_300.bin b/params_shard_300.bin new file mode 100644 index 0000000000000000000000000000000000000000..c61f8f973e222b2d32bab255aa4a5d1a645d7a0a --- /dev/null +++ b/params_shard_300.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff385f15f0aa10023cc8330867e8e82acb7695fd8f1626fede4593b49b4d6a6a +size 23511040 diff --git a/params_shard_301.bin b/params_shard_301.bin new file mode 100644 index 0000000000000000000000000000000000000000..9f68e334701ea0ba594d7cd0efeb36b505afb01c --- /dev/null +++ b/params_shard_301.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e303fe9cbf8b1960a6ded6872503aae31293c0daf273502420eec3ea6cfcdc42 +size 33587200 diff --git a/params_shard_302.bin b/params_shard_302.bin new file mode 100644 index 0000000000000000000000000000000000000000..0270355cbfb3cde6c992d74047ed557344d0a88f --- /dev/null +++ b/params_shard_302.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf756c553d4fca28abadb7630301d0f76e0b4ae669c3ddf4a8bb0af4fee30d19 +size 26869760 diff --git a/params_shard_303.bin b/params_shard_303.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8edc1fb158e036105d87cca5481de161ea5d0aa --- /dev/null +++ b/params_shard_303.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7de56157cca4dc586679654fc8625a24d557468d34265ee1692f82bafd53567 +size 31117312 diff --git a/params_shard_304.bin b/params_shard_304.bin new file mode 100644 index 0000000000000000000000000000000000000000..b94d1f66244309f8124c2dfecfc356c5c54a5180 --- /dev/null +++ b/params_shard_304.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c553f4c644901e7577a16c22d771e2169245dcce5e08b03e4cc41e6eba98cc +size 93978624 diff --git a/params_shard_305.bin b/params_shard_305.bin new file mode 100644 index 0000000000000000000000000000000000000000..af63542acb892540c834cdea84ee93feb71059a7 --- /dev/null +++ b/params_shard_305.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57064a8561acdfc4529c47650d12ed81d557bc6edc6ac397779e478e6457cb15 +size 188088320 diff --git a/params_shard_306.bin b/params_shard_306.bin new file mode 100644 index 0000000000000000000000000000000000000000..adccb94e37c4e23c361c3a1806831e9cba6253d7 --- /dev/null +++ b/params_shard_306.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d93d16e2221eb2e4230d68b9f07204e7c97eee3e288e5b6ae0c33df809069dac +size 23511040 diff --git a/params_shard_307.bin b/params_shard_307.bin new file mode 100644 index 0000000000000000000000000000000000000000..db1a3dd955f31b99a3ca0aff9bba9f158022681c --- /dev/null +++ b/params_shard_307.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e634b6873d1fa0be2d4093f758d0089c627024262bf635faebdb385a7fc867 +size 33587200 diff --git a/params_shard_308.bin b/params_shard_308.bin new file mode 100644 index 0000000000000000000000000000000000000000..519e3663faf2670bf46ba199da5937cbf113e1b0 --- /dev/null +++ b/params_shard_308.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5e10e88bd4f4eb04aa2674cc23eab5fb27e7615c100147506f94a712356ef08 +size 26869760 diff --git a/params_shard_309.bin b/params_shard_309.bin new file mode 100644 index 0000000000000000000000000000000000000000..c547659a3f839589755587a4a06666854ca564b1 --- /dev/null +++ b/params_shard_309.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7ad658b8f06a9c8269d367f6e175114b040c5ebdc08a66cb137fb058b8e63f9 +size 188088320 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..aacebf52f85adf8e4a73c47965d2c1904245af97 --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f61cf35eb3ceaaf463280f419facd029d3109b90667e6257d03848436e6494 +size 23511040 diff --git a/params_shard_310.bin b/params_shard_310.bin new file mode 100644 index 0000000000000000000000000000000000000000..56c8af5f6276641c4efbea44ed50e24576ad6876 --- /dev/null +++ b/params_shard_310.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3711d3bfa8d935706d2209f3c359c452872570d706f81ba608a411b0f1885e2 +size 23511040 diff --git a/params_shard_311.bin b/params_shard_311.bin new file mode 100644 index 0000000000000000000000000000000000000000..7fd5e424dd34d905e4ebcf455948d84f1214f26f --- /dev/null +++ b/params_shard_311.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6318478c2f7334148f5681cabc8d1b858b5de9fd216be329f25e50361d860e5c +size 33587200 diff --git a/params_shard_312.bin b/params_shard_312.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7df316cb601a6c2ec9804937c44aeab67b823cc --- /dev/null +++ b/params_shard_312.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1e7dd2e0c4bfbee1c1fb7dda1bf113fcc31a8af189fe4d2ac570fa1f6b7721f +size 26869760 diff --git a/params_shard_313.bin b/params_shard_313.bin new file mode 100644 index 0000000000000000000000000000000000000000..53cfc2dafff6f279c9ccbd4e057866c8d7751e44 --- /dev/null +++ b/params_shard_313.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:951a664887743193157c1322ef3f233ab850e35399ca347b17024592675b451d +size 93978624 diff --git a/params_shard_314.bin b/params_shard_314.bin new file mode 100644 index 0000000000000000000000000000000000000000..288c8f2f07bc739fc7a513540c8cb58961215d22 --- /dev/null +++ b/params_shard_314.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f51e2aedaf4fa38d545a4e7d2fa4adda9eb963a9624dc37573fd23ff5ac4948 +size 30269440 diff --git a/params_shard_315.bin b/params_shard_315.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd5a7b07c567b291f8686639714d80d3c6e2a891 --- /dev/null +++ b/params_shard_315.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:907b0792188e56c3b257fb666a910c80c3e02437c98393912b9b2cb623ae7901 +size 93978624 diff --git a/params_shard_316.bin b/params_shard_316.bin new file mode 100644 index 0000000000000000000000000000000000000000..d87243f5950df31ae98dd20ef3e3d145a525f0d9 --- /dev/null +++ b/params_shard_316.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ec318dc958c6aa19004f8778e179788882f4f0fa50cca4f5898fcff1f5cdc4 +size 188088320 diff --git a/params_shard_317.bin b/params_shard_317.bin new file mode 100644 index 0000000000000000000000000000000000000000..8ce6a02c6ec4736fcba921ab322dd7ad4321c251 --- /dev/null +++ b/params_shard_317.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bd43b2ee127278efd3adb54d0bc4f495ae742a8f1c4727a9641dfa9d67f5d91 +size 23511040 diff --git a/params_shard_318.bin b/params_shard_318.bin new file mode 100644 index 0000000000000000000000000000000000000000..91748936a127b82967c6977d727887ee137cb2ce --- /dev/null +++ b/params_shard_318.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d890d9f87fcce93d9b56e20df33cfc5bda43e9f9bdf9792a5e978bd69676dd45 +size 33587200 diff --git a/params_shard_319.bin b/params_shard_319.bin new file mode 100644 index 0000000000000000000000000000000000000000..87caebaea7aa1ab8135fae6996b46380acd057c9 --- /dev/null +++ b/params_shard_319.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7198fc9056448beda8fb43e3dff254ac52f1a08d5408d3aa9d610a42b97470f +size 26869760 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a6603d5937059a317bc21312e4ec0fa81f020c1 --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3f3fbee00edeb8af62cf6d16b78222e259d25f6d28b0d06b3f6dad31004f244 +size 33587200 diff --git a/params_shard_320.bin b/params_shard_320.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a84043036ec8696ff2f418e9e36efe213b883dd --- /dev/null +++ b/params_shard_320.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d9244195fe8c8d519a6bbd7cd2078fa087d334ee82950c5b04689911bf7f43 +size 93978624 diff --git a/params_shard_321.bin b/params_shard_321.bin new file mode 100644 index 0000000000000000000000000000000000000000..667ffb2ef5520ae91cac8696cecf956333c22c70 --- /dev/null +++ b/params_shard_321.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15df41dea6830d3f38b10cf9ed9edd4064b46664fa3ba8929788f2a0f6c96343 +size 31117312 diff --git a/params_shard_322.bin b/params_shard_322.bin new file mode 100644 index 0000000000000000000000000000000000000000..00ca0b118992259ba542e83e6f1d8baa262ceebf --- /dev/null +++ b/params_shard_322.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aec44633e3f69e6639f698eb627145bc118a7c215f73d5b73c4c49e5aed729b +size 188088320 diff --git a/params_shard_323.bin b/params_shard_323.bin new file mode 100644 index 0000000000000000000000000000000000000000..15314415e4d2c87cb37a12260cb13901d218008a --- /dev/null +++ b/params_shard_323.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18b73026a20ea4afac853e0fede8f966145fa4739b9df4c70b4737a0ee6c7c17 +size 23511040 diff --git a/params_shard_324.bin b/params_shard_324.bin new file mode 100644 index 0000000000000000000000000000000000000000..a48b4a65c63a0d5b7265f76a9d6e1d9facc55de7 --- /dev/null +++ b/params_shard_324.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cccf6924e486bed1d3eb5fd5e7c4788a192f537ceac649f7d28935bc66fa6a49 +size 33587200 diff --git a/params_shard_325.bin b/params_shard_325.bin new file mode 100644 index 0000000000000000000000000000000000000000..4d64e3e944e65156080fc7faf7131158a9338606 --- /dev/null +++ b/params_shard_325.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a4793df065d7493d4e048b0f926d528eec6e969b6b140203b9c588915eeb072 +size 26869760 diff --git a/params_shard_326.bin b/params_shard_326.bin new file mode 100644 index 0000000000000000000000000000000000000000..829c863edaa9d3bc807ce61e539a9dcf1a2ff01e --- /dev/null +++ b/params_shard_326.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51233ead2594a674b55c7a484550d14ab744011deab65ab19196bd161a17fbbb +size 33587200 diff --git a/params_shard_327.bin b/params_shard_327.bin new file mode 100644 index 0000000000000000000000000000000000000000..4526015cb8b2b196d29d825523f01d7f90125ff7 --- /dev/null +++ b/params_shard_327.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:357e7d6db939152dd9c9d6f3ec0e2c8f4e0fa78896e44fc36e652871f798f6ac +size 26869760 diff --git a/params_shard_328.bin b/params_shard_328.bin new file mode 100644 index 0000000000000000000000000000000000000000..672a689a7c3cbb0bb8d9b55a2cb795553a2daf4d --- /dev/null +++ b/params_shard_328.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b50242b0ebe04240a7fa9607902229b3c35c627ffb2222ceb71dfc6991de4d1 +size 93978624 diff --git a/params_shard_329.bin b/params_shard_329.bin new file mode 100644 index 0000000000000000000000000000000000000000..eeba7ab228269c1f506f5732a6c4911143c8b965 --- /dev/null +++ b/params_shard_329.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9d11487c6f111322e57b38c26d950a2f73078e9db89d10696884c6e9afc868 +size 26894336 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..68777680248af6869575c4360f48220d427e0550 --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:480841ece1451d189db9739e3a7a79f3d10029143b79f22c14c2d3563834e0dc +size 26869760 diff --git a/params_shard_330.bin b/params_shard_330.bin new file mode 100644 index 0000000000000000000000000000000000000000..1836a4b89f0e38901ca09bd41ec5e64eedea7316 --- /dev/null +++ b/params_shard_330.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42bcc84f6dc5f98eaf0ceae041f1784a16bbec228e85a0dfc481256921aabffe +size 188088320 diff --git a/params_shard_331.bin b/params_shard_331.bin new file mode 100644 index 0000000000000000000000000000000000000000..23f811e16820808081babf0c01298799634b5ed3 --- /dev/null +++ b/params_shard_331.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87117df2823a44ab86530f9cb0fbdc4753dd61a0cc460c894f814e297ddccb30 +size 23511040 diff --git a/params_shard_332.bin b/params_shard_332.bin new file mode 100644 index 0000000000000000000000000000000000000000..647c3070a121f29ebf948a96eafb4964bcb895f5 --- /dev/null +++ b/params_shard_332.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef164afd75cfd440c3010c9be5c2b7ee62b28588a14dac2301f0300c50746cd +size 93978624 diff --git a/params_shard_333.bin b/params_shard_333.bin new file mode 100644 index 0000000000000000000000000000000000000000..0d9ce6106fa81221637730975521c2a821a90a1f --- /dev/null +++ b/params_shard_333.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8497c96eb6710cdb431efb31a0fae64b27116a4d4f7eb8c2c5d31c722a88c3 +size 188088320 diff --git a/params_shard_334.bin b/params_shard_334.bin new file mode 100644 index 0000000000000000000000000000000000000000..0517ae9f7be5705030dd178a806445b87392a92f --- /dev/null +++ b/params_shard_334.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44166b05bc0c17177ad3742a789ce127a5babd9d47213447d603def65384094f +size 23511040 diff --git a/params_shard_335.bin b/params_shard_335.bin new file mode 100644 index 0000000000000000000000000000000000000000..713fc87dd4a3bd5c2f4c39d3fa18118de1c21995 --- /dev/null +++ b/params_shard_335.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6fa8ac022b7b6b34ed8f49638eecad88708180e69bf63a6a707aee78e9a5a03 +size 33587200 diff --git a/params_shard_336.bin b/params_shard_336.bin new file mode 100644 index 0000000000000000000000000000000000000000..87d486c53e3cd3e6d0a647e64f8865802532d667 --- /dev/null +++ b/params_shard_336.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85063f1cc7fb2421b146b8e74949cea7d408e3a81b1caaac27ffae8c1f507d26 +size 26869760 diff --git a/params_shard_337.bin b/params_shard_337.bin new file mode 100644 index 0000000000000000000000000000000000000000..c92330893425aa7b4357063efdae9b9551181f71 --- /dev/null +++ b/params_shard_337.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:658b451131f7780b1af6f09a7adfeb4eb144d8f62a56b9636667560fa8314229 +size 93978624 diff --git a/params_shard_338.bin b/params_shard_338.bin new file mode 100644 index 0000000000000000000000000000000000000000..93ca1adb12d71c94c5efc0b6df993a48e743975f --- /dev/null +++ b/params_shard_338.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:408f898761623f70d1dd79ba266a161675b05ae80e7d70ac9f9c6fa608174610 +size 31117312 diff --git a/params_shard_339.bin b/params_shard_339.bin new file mode 100644 index 0000000000000000000000000000000000000000..78bae606a044eb51e59427b50173e35c76b9e063 --- /dev/null +++ b/params_shard_339.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c2b118d2c19034cd31bc67161ec8f5e167e63531128b514366a609c763ff692 +size 188088320 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..61ba5557f87b2fef59c512ea81b7ff1c56f43a31 --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36f8d090bba7947ee197aaf1f18208a6b59cb17c97caeef7a18ad2b69f3366e5 +size 93978624 diff --git a/params_shard_340.bin b/params_shard_340.bin new file mode 100644 index 0000000000000000000000000000000000000000..caf0b11ad197eae6f12eaceb3e376294ef7c1f4a --- /dev/null +++ b/params_shard_340.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6a53d7d71a05a9e26dfcf116a78515facf0147d6c1af70a5cb6ab06567f573d +size 23511040 diff --git a/params_shard_341.bin b/params_shard_341.bin new file mode 100644 index 0000000000000000000000000000000000000000..87c4bc7ef889a58626847a32ac4fcb77857e58de --- /dev/null +++ b/params_shard_341.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:321fa8299afefc40813558c04b08f21954391d297af94f64a5126d37d320499d +size 33587200 diff --git a/params_shard_342.bin b/params_shard_342.bin new file mode 100644 index 0000000000000000000000000000000000000000..d502afbc209b0d6b627b554b6d104e5fdd70be9d --- /dev/null +++ b/params_shard_342.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05efcc0d16b458137e76ebec1180a0e25ab5f25694d1a20cc359e15da851cbab +size 26869760 diff --git a/params_shard_343.bin b/params_shard_343.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2f3774aa59af1f05ebe626e2767a557206e120d --- /dev/null +++ b/params_shard_343.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1ccf1419711f152d0e22bc0529f0114c8d868ce2ae6a0fc771b23c9d8c065e +size 33587200 diff --git a/params_shard_344.bin b/params_shard_344.bin new file mode 100644 index 0000000000000000000000000000000000000000..5ed6c49f0da86f90cbd7cb89ec2ec80409b34bb5 --- /dev/null +++ b/params_shard_344.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2349791d66090f0439d92da2c3cfe2f5d27675086a0642cb9650b30797ce575 +size 93978624 diff --git a/params_shard_345.bin b/params_shard_345.bin new file mode 100644 index 0000000000000000000000000000000000000000..d07c5becd1de397a19116297eb37b4d3d0b61555 --- /dev/null +++ b/params_shard_345.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b47776da13ea3fef331da83e58822792582eae5473d913da481407597a0f2a +size 23535616 diff --git a/params_shard_346.bin b/params_shard_346.bin new file mode 100644 index 0000000000000000000000000000000000000000..0825dc42d27e869d31bd12dfaa36d107196a6e06 --- /dev/null +++ b/params_shard_346.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2bdea47d82b0bec9e9da19fd57b2e0c44aac05a3c41a05b05beb6c43077628 +size 188088320 diff --git a/params_shard_347.bin b/params_shard_347.bin new file mode 100644 index 0000000000000000000000000000000000000000..e622f0c301d3f829aeec2c2cf7b23ced2c5abad9 --- /dev/null +++ b/params_shard_347.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3631010bdbe6d349f5e22e8a587e732ef739fe41a0881b9a1c10cec09dc434fc +size 23511040 diff --git a/params_shard_348.bin b/params_shard_348.bin new file mode 100644 index 0000000000000000000000000000000000000000..45bea1de9097f4c5f38253bd6b821a29133876e5 --- /dev/null +++ b/params_shard_348.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8a78f5a47300b7b60b660dbdc3e287b1370c802e5f524103dee0c4dd592a8d +size 26869760 diff --git a/params_shard_349.bin b/params_shard_349.bin new file mode 100644 index 0000000000000000000000000000000000000000..9a04a542ebd291fff1582ca5f847b38ff4266d98 --- /dev/null +++ b/params_shard_349.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f263add1ac209809de080d995b8b8703442da7ec2e7489e509d55f355afddf1 +size 93978624 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..0af564533728f9abdef4bbc6ed44ba9969372537 --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a8ff94e6a270925c43fe2aabc791d1da606664b6064ec75ae75cc3738ae654b +size 188088320 diff --git a/params_shard_350.bin b/params_shard_350.bin new file mode 100644 index 0000000000000000000000000000000000000000..e56373e4f6da52c4a6a592852e2a4881a5fc995f --- /dev/null +++ b/params_shard_350.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc84fd795106ff200e4fa3a855a6609f4db8e2fd59521ed83e0c08af562f49c8 +size 188088320 diff --git a/params_shard_351.bin b/params_shard_351.bin new file mode 100644 index 0000000000000000000000000000000000000000..85283fe9500ab9a10d3fcc6852a3cfe2de700fb3 --- /dev/null +++ b/params_shard_351.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c18fdcbfa592cd05c48dd4c91836970ee2e222cc0b3fac0980fb3b3204bc4565 +size 23511040 diff --git a/params_shard_352.bin b/params_shard_352.bin new file mode 100644 index 0000000000000000000000000000000000000000..4032457f4c8b6e50f0bf038ac885c6f3275c6932 --- /dev/null +++ b/params_shard_352.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c2a43792336cbe453e73186017a63befa3021dcd490007456221b90d838796 +size 33587200 diff --git a/params_shard_353.bin b/params_shard_353.bin new file mode 100644 index 0000000000000000000000000000000000000000..99398c4c1f527f3707ab4b1bb7a89d05ae2d1251 --- /dev/null +++ b/params_shard_353.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af39246177a3859b7a7797132128c1349d96f6521d34a6e663e6a9f73682f6d8 +size 26869760 diff --git a/params_shard_354.bin b/params_shard_354.bin new file mode 100644 index 0000000000000000000000000000000000000000..37d701783a55aa75b28e7409dd385c4e4df69735 --- /dev/null +++ b/params_shard_354.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:356bf60073b8e6c189f91e801a34866e93e5e0b3a23df033e0e7cc21fba28d7c +size 31100928 diff --git a/params_shard_355.bin b/params_shard_355.bin new file mode 100644 index 0000000000000000000000000000000000000000..88f19b7f4b5e49abd594baf81458f1fc20bff369 --- /dev/null +++ b/params_shard_355.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9b942c9f1783be9b266dd9e3597b6472ad4de2cf30042a5de410e8857a4a17c +size 93978624 diff --git a/params_shard_356.bin b/params_shard_356.bin new file mode 100644 index 0000000000000000000000000000000000000000..e9a4e3068ef719144bcee2fa6ac7bbbf816825ab --- /dev/null +++ b/params_shard_356.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0843e671ecb362285c02f5a8a89d79846fa2005a1fc9bba61687712d95d66df8 +size 188088320 diff --git a/params_shard_357.bin b/params_shard_357.bin new file mode 100644 index 0000000000000000000000000000000000000000..24f5d16f6b95880ea796625bab44f6eb05320185 --- /dev/null +++ b/params_shard_357.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a8f66e7aaa833e4ee71f0164d95cf0f853e22ea5a20a1107afd5406a57863d4 +size 23511040 diff --git a/params_shard_358.bin b/params_shard_358.bin new file mode 100644 index 0000000000000000000000000000000000000000..e80e96f6a4d61dc87c9c259ba7dfb48e08e34350 --- /dev/null +++ b/params_shard_358.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f29eff08636dde18dc6db06134ccf8060a2abf518c01984e4e4df2805ee4ae69 +size 33587200 diff --git a/params_shard_359.bin b/params_shard_359.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa45859bd1aa097c5cf6e33f3d93c078fb476e1a --- /dev/null +++ b/params_shard_359.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e35e09fd524957fa8c5ca02ae863431fa2aeb950b82f448410359eb28f64b4df +size 26869760 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..f3d63a9821a877f4467346fbc7fcc6886c682507 --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2dfb194b2f6dc03b2b84809596d99aefa910bcc63743ea8593b48c6eb9ab61d +size 23511040 diff --git a/params_shard_360.bin b/params_shard_360.bin new file mode 100644 index 0000000000000000000000000000000000000000..2b79caa5f76c4e49299503a140724c5c4024abf4 --- /dev/null +++ b/params_shard_360.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c161752a09adf09b2997860f327743032cad22e1461d7d38481c09933b433d18 +size 93978624 diff --git a/params_shard_361.bin b/params_shard_361.bin new file mode 100644 index 0000000000000000000000000000000000000000..d8027f43015107522c7ca946a016296981a822c9 --- /dev/null +++ b/params_shard_361.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d760b3f17e3dc47184483855ec42df737bfcd6fd97e75ec370531a49bcfd5566 +size 22712320 diff --git a/params_shard_362.bin b/params_shard_362.bin new file mode 100644 index 0000000000000000000000000000000000000000..400e3a649133ba419c0632e0e87c951f3ef1bb79 --- /dev/null +++ b/params_shard_362.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dff7840f14ff2444c84a3019d550dd16da636fe8e6b98d3b9f3693d4475b76e5 +size 188088320 diff --git a/params_shard_363.bin b/params_shard_363.bin new file mode 100644 index 0000000000000000000000000000000000000000..b26d835182b47d548042101c20c3de9a6e9beea2 --- /dev/null +++ b/params_shard_363.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d021d79d004ff083182c432156e1421a02f0e9316499887ec68e16e938ab07 +size 23511040 diff --git a/params_shard_364.bin b/params_shard_364.bin new file mode 100644 index 0000000000000000000000000000000000000000..150016aa8e795e711c64875816d297c99e0016f9 --- /dev/null +++ b/params_shard_364.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a7b84b9f6e33709333acbf0c62bb95c1c8c70643bd82d7cecaba118e2ddca08 +size 33587200 diff --git a/params_shard_365.bin b/params_shard_365.bin new file mode 100644 index 0000000000000000000000000000000000000000..6866f0a2934d06e1d73b5c8d2d8fbfad259b4dbe --- /dev/null +++ b/params_shard_365.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21f1638cb8cca0a755eb73c14a77e13af693120f7e57fc11fea9a3599c7cca8c +size 26869760 diff --git a/params_shard_366.bin b/params_shard_366.bin new file mode 100644 index 0000000000000000000000000000000000000000..ac721aecab543e3152ddd850bdc1fff7c03b1f6e --- /dev/null +++ b/params_shard_366.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd0ad8e9eadfe891a452ca3bd0be928e753be51934281bbd07de0db2adea7d98 +size 93978624 diff --git a/params_shard_367.bin b/params_shard_367.bin new file mode 100644 index 0000000000000000000000000000000000000000..e6924722f79ba12ac34bd1a15beb4f008fb27643 --- /dev/null +++ b/params_shard_367.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b174bcf1a7212dc1b4748d4bb53b29b88fbe5244fb3c1f0ecc2e997d93fef0b +size 188088320 diff --git a/params_shard_368.bin b/params_shard_368.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c3a6fe923443dbcbf2a8e9350d6309df92c8044 --- /dev/null +++ b/params_shard_368.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9600adc63fc83663e12b50f10dccd6d86c2966b5c7cef900b46c8c07fce1b2a8 +size 23511040 diff --git a/params_shard_369.bin b/params_shard_369.bin new file mode 100644 index 0000000000000000000000000000000000000000..549291d12c39f7468246ce7231789e044a974d72 --- /dev/null +++ b/params_shard_369.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c6697cb1cf48d6abee467fb017bbf1fe45a73ebbc825e887adee2d7b72e3072 +size 33587200 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..50215d274644b03d5eea208620c2a49c41d70778 --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab15dfad9ca45770ce280c75eb3950938b294405c6d937d54bafe3a450fc73c6 +size 33587200 diff --git a/params_shard_370.bin b/params_shard_370.bin new file mode 100644 index 0000000000000000000000000000000000000000..66a8d8052a9c082225fb819e7f51afc609750344 --- /dev/null +++ b/params_shard_370.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed0aac776a1e3d4506aa5b05136e2be79c542b718208b063368c125c42c0c72 +size 31100928 diff --git a/params_shard_371.bin b/params_shard_371.bin new file mode 100644 index 0000000000000000000000000000000000000000..c742d94f6e6032e20cf25147a405dc7e2435ff9b --- /dev/null +++ b/params_shard_371.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e2028d2473cb79581c33d685c390c8cb44dcf06247c0f948f7c4b3ba04138ce +size 31068160 diff --git a/params_shard_372.bin b/params_shard_372.bin new file mode 100644 index 0000000000000000000000000000000000000000..14217391cc021799000b211c7eb601ac489b9eed --- /dev/null +++ b/params_shard_372.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:255c379296aa81a75ce4039ea3b346cde5fb48c1245cdeb16b0d3a41dec78915 +size 188088320 diff --git a/params_shard_373.bin b/params_shard_373.bin new file mode 100644 index 0000000000000000000000000000000000000000..708a84cb1e6774a250e5ee8d40bd72a46ffa65eb --- /dev/null +++ b/params_shard_373.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7345a1a655d2296b72016e46927abc359b5355c2ed6d61a4e5a4c9ce8b3a25b6 +size 33587200 diff --git a/params_shard_374.bin b/params_shard_374.bin new file mode 100644 index 0000000000000000000000000000000000000000..aedccca7ffd6bd0874a6bbe2597eceea159e60d2 --- /dev/null +++ b/params_shard_374.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df341a59371186dd6ec0683c44e54ac5dcb986a1dff99d164139ede9a21721d8 +size 26869760 diff --git a/params_shard_375.bin b/params_shard_375.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef779b916921746764d4f7e339de3e5d317ceb27 --- /dev/null +++ b/params_shard_375.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:491663922156b786da4b57824de49a57d377dfef4763c4ed402a8a6223c70b8e +size 31068160 diff --git a/params_shard_376.bin b/params_shard_376.bin new file mode 100644 index 0000000000000000000000000000000000000000..4f30ebcbfb6912874c8fcc0a3cc668ec8eb04213 --- /dev/null +++ b/params_shard_376.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033f04921c10a48443b8bd8c43bb9d288a80d2971f44215f9e3a3b043a835483 +size 93978624 diff --git a/params_shard_377.bin b/params_shard_377.bin new file mode 100644 index 0000000000000000000000000000000000000000..3737a041b9e52e3e469ecbf5277915728617bc1f --- /dev/null +++ b/params_shard_377.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cd6ccc5d87ac56ce5d133c90808a21a10c3a79b37dd4cfbf0fb1c6b63fd88dd +size 93978624 diff --git a/params_shard_378.bin b/params_shard_378.bin new file mode 100644 index 0000000000000000000000000000000000000000..bef35b12456f9240e621484049a57fd02507da5d --- /dev/null +++ b/params_shard_378.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f25ada1592ce0969fe41b0a97f9e85b9dd5905529bcf1b4ceaf7d460f4ec9ad +size 188088320 diff --git a/params_shard_379.bin b/params_shard_379.bin new file mode 100644 index 0000000000000000000000000000000000000000..b952670fd8241ed622c787cfd323e4175e539df5 --- /dev/null +++ b/params_shard_379.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1f52f7e43d57949874119335d49c90bb0dac0c55d46da108397924bf46b6e44 +size 23511040 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..330baf8a43b6cbe1d967007743e5fe0bb518e8e1 --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddfa7ca16c3729f119f4093e264e773b82a74559fb574e8ed5e83a9e23d1f9e8 +size 31100928 diff --git a/params_shard_380.bin b/params_shard_380.bin new file mode 100644 index 0000000000000000000000000000000000000000..320ce0c02377d340e7277c61280ab53dca0b514a --- /dev/null +++ b/params_shard_380.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b15b51a74b1f39a3e23c4556980bc8d40d7e14b23b235f7972cd2b6459a54d9 +size 33587200 diff --git a/params_shard_381.bin b/params_shard_381.bin new file mode 100644 index 0000000000000000000000000000000000000000..b4740d2a658f4cfd6abe8c4c5070067303b75df3 --- /dev/null +++ b/params_shard_381.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11a0bcaf865e51ee1ced06566ba867d57dd918fc3bda35c8841501ad501e6923 +size 26869760 diff --git a/params_shard_382.bin b/params_shard_382.bin new file mode 100644 index 0000000000000000000000000000000000000000..730c09d1ff51d582399478429b47b9e6985a2787 --- /dev/null +++ b/params_shard_382.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cabd3abbb8030cf36221bd47e368be98bc12fd3eb4d7914a9ab10ee0aca45360 +size 31117312 diff --git a/params_shard_383.bin b/params_shard_383.bin new file mode 100644 index 0000000000000000000000000000000000000000..5131dcb5a52c368d80352369264e027c442065a9 --- /dev/null +++ b/params_shard_383.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cc3287dcfeb0248785f73554ccba7ba3411ebb90cb87596e191e5294a8de4f5 +size 93978624 diff --git a/params_shard_384.bin b/params_shard_384.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb2d1ed48acecb72ee9469589425f12e6632a5a5 --- /dev/null +++ b/params_shard_384.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d283c6fb8ce401688fb65a22bd41bd6e8eb8c79820ef7376e5ea17db3b661926 +size 188088320 diff --git a/params_shard_385.bin b/params_shard_385.bin new file mode 100644 index 0000000000000000000000000000000000000000..6b982e25fff0cef493991658336ecadb59636aac --- /dev/null +++ b/params_shard_385.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98df3549bd4e00ee5ab764ecf0304da53914cd85920bcaabcbb5adc86eeec828 +size 23511040 diff --git a/params_shard_386.bin b/params_shard_386.bin new file mode 100644 index 0000000000000000000000000000000000000000..bde4807aeb8418ed7ce625c2505bc8dfc7a5fcc0 --- /dev/null +++ b/params_shard_386.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb70f64dfdac09f725ea774fce3fe78eb586bdd09f02605695c03ec8f7c7ec19 +size 33587200 diff --git a/params_shard_387.bin b/params_shard_387.bin new file mode 100644 index 0000000000000000000000000000000000000000..a0f4717bd6ff60649717c435b5ffd380757ff572 --- /dev/null +++ b/params_shard_387.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:812a9dd41dc423ea221d5978991a239ef6c9cefe404df5e2c049937eac7eda00 +size 26869760 diff --git a/params_shard_388.bin b/params_shard_388.bin new file mode 100644 index 0000000000000000000000000000000000000000..51b105764396dbc7114fe4790fe67e70e1b1f423 --- /dev/null +++ b/params_shard_388.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2715aa4847671bc1794d78f56be04f5a28aeb045b1b0ca69723166c4409d6e7 +size 188088320 diff --git a/params_shard_389.bin b/params_shard_389.bin new file mode 100644 index 0000000000000000000000000000000000000000..19723fa5d90e8b08dcdacf1d4793f786856f1734 --- /dev/null +++ b/params_shard_389.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d58581cd9b00a4c3f5b17180c73ca1e70843ba17e995af236dff7be94c508a3b +size 23511040 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..1a3dfcaf0dea8f8612e0ce560632be885a6879a1 --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf365cdcd9fbf1d0b5f1345329689890c8ef8ec801beb1f970bceecb5ccc940c +size 31068160 diff --git a/params_shard_390.bin b/params_shard_390.bin new file mode 100644 index 0000000000000000000000000000000000000000..162209844184d41445b2f9fcdbf8675aacb2816b --- /dev/null +++ b/params_shard_390.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3e8fab2fc1b876133602a5b6336c6a30267d42f399d996163f6a148899651c4 +size 33587200 diff --git a/params_shard_391.bin b/params_shard_391.bin new file mode 100644 index 0000000000000000000000000000000000000000..38c14238135e750eaf5c0ee3dd1fd6ba0c504589 --- /dev/null +++ b/params_shard_391.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae727f3ddafb520a5b6beda10350d4c15a825b1d62531999da12520c16861e9b +size 26869760 diff --git a/params_shard_392.bin b/params_shard_392.bin new file mode 100644 index 0000000000000000000000000000000000000000..73a4a0cfb2cf8964f2e5156937cf650953354d1e --- /dev/null +++ b/params_shard_392.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3934c5b6651f82ba67d6e7d991d28443eff049dcfdb87ab1c3642b515657fabe +size 93978624 diff --git a/params_shard_393.bin b/params_shard_393.bin new file mode 100644 index 0000000000000000000000000000000000000000..5510997ce8b8be09b9a5bb5100985b87f85ce570 --- /dev/null +++ b/params_shard_393.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea799d7c0b63dc8a0aab4f48a5ce74468bd3ae5e83bd7408cfa31ec9067e3c6 +size 30269440 diff --git a/params_shard_394.bin b/params_shard_394.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef0ca43494637686386980028bac6df7c2ba2c5b --- /dev/null +++ b/params_shard_394.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6abf234852d792587d802fe823d20a2ea89705a831d3d46f4cb1c15963ede6ca +size 188088320 diff --git a/params_shard_395.bin b/params_shard_395.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e1bee8b83b71c520a2e5dc7d5331af8398ff3b2 --- /dev/null +++ b/params_shard_395.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c792f2a9bb3c199496a4a258e428ccd592f7d5487b01fcfaa1e7cbd93adc39 +size 23511040 diff --git a/params_shard_396.bin b/params_shard_396.bin new file mode 100644 index 0000000000000000000000000000000000000000..e920950c5cc06cdde96e9a816450040be73de723 --- /dev/null +++ b/params_shard_396.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbcb52c9edb12cb864fe9796fe5d61e475613bb757a5c22ba18b9781c8001cea +size 26869760 diff --git a/params_shard_397.bin b/params_shard_397.bin new file mode 100644 index 0000000000000000000000000000000000000000..4f6e0614e13eef8c72300acc34d148f957182f2b --- /dev/null +++ b/params_shard_397.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f823f7838784615ca38ffb40dd9250b969b931c46ef7c5caaffcbd7ada306d9 +size 93978624 diff --git a/params_shard_398.bin b/params_shard_398.bin new file mode 100644 index 0000000000000000000000000000000000000000..dc2780c9d1cc6c416ae752e356a161e543411875 --- /dev/null +++ b/params_shard_398.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17770aa27d06a06afff491567ad96d5f86a9ef928076a0a9da46b541005d3931 +size 188088320 diff --git a/params_shard_399.bin b/params_shard_399.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e36281a35d31c450e32738e386a1fdbe31e4547 --- /dev/null +++ b/params_shard_399.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f4229c4c40d92cfdb9ca53cbde87495559ed0eff614165b0090b5c8982b46a2 +size 23511040 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..1b139cd4f5d03065847486a4c21ab400605ddd40 --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb73cff9ca505f23c0295f9eda0375d1c102fa2c6afd99779a4bd3664cdff04 +size 93978624 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..c004d33d75511f4ec6ca7fc877d661b37eb3afa6 --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ed7e8d1e40141dcfc61df27fb4776680cdddb2ddd0fc9de8caddb1f191e3116 +size 188088320 diff --git a/params_shard_400.bin b/params_shard_400.bin new file mode 100644 index 0000000000000000000000000000000000000000..7c1ca10eca676c93387e7c48b216888584bbbbc1 --- /dev/null +++ b/params_shard_400.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5d1554e106ff24d87bf958aa751cd9a9bcb3e17161ae2b37b062def267432e7 +size 33587200 diff --git a/params_shard_401.bin b/params_shard_401.bin new file mode 100644 index 0000000000000000000000000000000000000000..d39826ca721dd2f84c73498437d174aec543caa0 --- /dev/null +++ b/params_shard_401.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:800601997997c919292d20333968f6b9ede19faf4243f7c58e4af2e4ea755dc1 +size 26869760 diff --git a/params_shard_402.bin b/params_shard_402.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1fc4ff8e2752b620938f840ff47cef82e7d8a59 --- /dev/null +++ b/params_shard_402.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cdf084ddd203602b0e2aa1e845261c8c2a7acf85f480eb29104845778e07bf1 +size 31100928 diff --git a/params_shard_403.bin b/params_shard_403.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0fa5ee65fabcbe0ef45b9024149cd1a413dcf64 --- /dev/null +++ b/params_shard_403.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:285c327b9ff0da9510e6d5a425784feb1c5e98bf6a1b26eb5722725936b843cf +size 93978624 diff --git a/params_shard_404.bin b/params_shard_404.bin new file mode 100644 index 0000000000000000000000000000000000000000..d5cee2e28fc398e5c835e247a6dddc501a8bddd1 --- /dev/null +++ b/params_shard_404.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a3861b679fa504097ad99f768f06b9aab72b99edb4c7f5b0cef579a1d2b29b5 +size 188088320 diff --git a/params_shard_405.bin b/params_shard_405.bin new file mode 100644 index 0000000000000000000000000000000000000000..c5587a0f0a15518319955bdd02ea01f946520957 --- /dev/null +++ b/params_shard_405.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0f22b0320d53d62206bd7ab538f96d28b3b32a6f4c1af24d02acf5c9935a7a7 +size 23511040 diff --git a/params_shard_406.bin b/params_shard_406.bin new file mode 100644 index 0000000000000000000000000000000000000000..34b0d0cb44910004f53bc869864bf18f28de34e3 --- /dev/null +++ b/params_shard_406.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90be05d811e923ad1e77e7266902bc5a28b51e4bd4ac2d22322d9b79ad95cbb8 +size 33587200 diff --git a/params_shard_407.bin b/params_shard_407.bin new file mode 100644 index 0000000000000000000000000000000000000000..ca94579e1b061be46abc55bb083ceadb5bb3e9b2 --- /dev/null +++ b/params_shard_407.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:001f3490e4cb7b5e7aa1bcaac82cf175fb88d2dbcc8621faf6b8e85d50b1c7d5 +size 26869760 diff --git a/params_shard_408.bin b/params_shard_408.bin new file mode 100644 index 0000000000000000000000000000000000000000..fab308466105f4db1941aa992fcee5e745922620 --- /dev/null +++ b/params_shard_408.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cae171af80a146937549c5a2776bfdb2ebf6679c9e7da9d3a8260904217cfcf9 +size 93978624 diff --git a/params_shard_409.bin b/params_shard_409.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab9a5c7293528689e5c0ef146c4dc998e44ab64d --- /dev/null +++ b/params_shard_409.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaf9b64fce77d5e007bc8a75305db4250da4859a927d5ffb766bbf8f8f3f3bc1 +size 22712320 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..88fe9b50f223a79abeb7e01b2ea4fe74fd1bc5ec --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38048c0e41786c8d107c3162982414d57f6a90a690b625eccd149e56d0952dbf +size 33587200 diff --git a/params_shard_410.bin b/params_shard_410.bin new file mode 100644 index 0000000000000000000000000000000000000000..30d208c41f8d87074414c0c4005e82cb8d49825b --- /dev/null +++ b/params_shard_410.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f566a1d911cf5895e927113a9167743b177cb1dc1df9b0e938464982d8ceae3 +size 93978624 diff --git a/params_shard_411.bin b/params_shard_411.bin new file mode 100644 index 0000000000000000000000000000000000000000..53c0d8d82949a3dd8a5355cfea4503a7bf74d03c --- /dev/null +++ b/params_shard_411.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7f82bfaf750ec914e766f6fce926354c52bc68cc6f2b8511a5c59839226b063 +size 188088320 diff --git a/params_shard_412.bin b/params_shard_412.bin new file mode 100644 index 0000000000000000000000000000000000000000..a6968973dba2219a98b5c280505d81b0edec1470 --- /dev/null +++ b/params_shard_412.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5c75558b65b38f343548e99b92d62b19e79143aa9edceb176fc1207a2722da1 +size 23511040 diff --git a/params_shard_413.bin b/params_shard_413.bin new file mode 100644 index 0000000000000000000000000000000000000000..1777c7d914348b2fd1fd3d3279bdf0638daa68be --- /dev/null +++ b/params_shard_413.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a68b31ccddbbc740cfccac65d06587644a10c1ef191ab20c253b869b7af5c25 +size 33587200 diff --git a/params_shard_414.bin b/params_shard_414.bin new file mode 100644 index 0000000000000000000000000000000000000000..e2acaf373ac0c03a31ab635430aa345b67ed4d10 --- /dev/null +++ b/params_shard_414.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f855fd549bd1bceaab98fe557344a28dd4bc4fb1bc9cef59d2322f2aaa2d735e +size 26869760 diff --git a/params_shard_415.bin b/params_shard_415.bin new file mode 100644 index 0000000000000000000000000000000000000000..28ea549e5a3a7c3348b2f3dffbbe74035ccdc03b --- /dev/null +++ b/params_shard_415.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:046b831c0ef7dcb184efeccec12ac5b6df9f3b4d6c3f421d04b82c6e5dd694e4 +size 93978624 diff --git a/params_shard_416.bin b/params_shard_416.bin new file mode 100644 index 0000000000000000000000000000000000000000..e9af5a65a7f912cf9249c1e473ee1d93daee84a9 --- /dev/null +++ b/params_shard_416.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84fb1922d0af43367b397c12dd8196b76d1b96acbd02e8355278d5fd87c795f2 +size 31117312 diff --git a/params_shard_417.bin b/params_shard_417.bin new file mode 100644 index 0000000000000000000000000000000000000000..db1dfc96e7d26a00b886e0b9672d944389912ad3 --- /dev/null +++ b/params_shard_417.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86b1f2b7317fdaa8b0ecf86a11534731b5b10dd5d6d131ad5888f21ec4d368b5 +size 188088320 diff --git a/params_shard_418.bin b/params_shard_418.bin new file mode 100644 index 0000000000000000000000000000000000000000..66336aafa56171dff2f756113b43ccf4a250b6be --- /dev/null +++ b/params_shard_418.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a5453055d2c49a1ed1ba66442861edb299270cbfd1886d4708097804197f70 +size 23511040 diff --git a/params_shard_419.bin b/params_shard_419.bin new file mode 100644 index 0000000000000000000000000000000000000000..136f837e312e0c02ef78179c873eaae4c3cb7906 --- /dev/null +++ b/params_shard_419.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56e14e2de8dcae6b18fd8cb68a2e7e81cbd699b2df91a54976bf6f73e16e2af +size 33587200 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..a33d341a2078fb42629918f8c5ef76cbd2a99c7d --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:424b76b4f8a279571cd303dbe161819113858469f23f27d6a37476c9ed0a16db +size 26869760 diff --git a/params_shard_420.bin b/params_shard_420.bin new file mode 100644 index 0000000000000000000000000000000000000000..f99e4a6c9d77b12e99fdee4ae74e556116b6230e --- /dev/null +++ b/params_shard_420.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d4d62af42f063d50b3342f94c994ef1070a58082cd65b6efce08ce7cd6b789 +size 26869760 diff --git a/params_shard_421.bin b/params_shard_421.bin new file mode 100644 index 0000000000000000000000000000000000000000..c4fbe85fab845aa26d014d95914e5d5126b9e371 --- /dev/null +++ b/params_shard_421.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b12a932841542a09b30292805106082513c4caf07f9aa316c781ff47b042c2 +size 33587200 diff --git a/params_shard_422.bin b/params_shard_422.bin new file mode 100644 index 0000000000000000000000000000000000000000..95a395a33ebcffcf75135cd6a88bde6625d16f1b --- /dev/null +++ b/params_shard_422.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c36491a97a207d861d284f793f7e098f5c670aee5e78a08ec566138c2f5bc0bd +size 26869760 diff --git a/params_shard_423.bin b/params_shard_423.bin new file mode 100644 index 0000000000000000000000000000000000000000..f339723f1712c2b5516496cd159c4a2104114d7e --- /dev/null +++ b/params_shard_423.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5240d29065233966485228046979a54cfab24a5b5585ae767199684a04c47b6c +size 93978624 diff --git a/params_shard_424.bin b/params_shard_424.bin new file mode 100644 index 0000000000000000000000000000000000000000..9f26eda38beeffc97c155eccee1315babd644380 --- /dev/null +++ b/params_shard_424.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa638564c83f7b78d267a52667e9958465ed669da2be91b7ce7c5e7357fe7384 +size 26894336 diff --git a/params_shard_425.bin b/params_shard_425.bin new file mode 100644 index 0000000000000000000000000000000000000000..081535443e3015dc1d1062fbf65b529fd73099b8 --- /dev/null +++ b/params_shard_425.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acbf9e825c91c4bf4ee5a957fdc00fa83e8547cd83ee6cedf3dfbeef6e052333 +size 188088320 diff --git a/params_shard_426.bin b/params_shard_426.bin new file mode 100644 index 0000000000000000000000000000000000000000..272be96b92cc885586d5eac64083ff36a30c0138 --- /dev/null +++ b/params_shard_426.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca5622c1d7950e6c5f42846dcc86674c0c6b99e08acb52f44d401934de52a39 +size 23511040 diff --git a/params_shard_427.bin b/params_shard_427.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c47919898ce3774be766096da97ffcfd46880f2 --- /dev/null +++ b/params_shard_427.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef6e55fab6eb4bc2f9c505203a1ef953736ca0ebf58cf60650c93271ea4da31c +size 93978624 diff --git a/params_shard_428.bin b/params_shard_428.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a8e276813b2f2bb2d5aa16844c2003da093e837 --- /dev/null +++ b/params_shard_428.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21bc92ff50b74e1ec00f7879040498db95e6da0be5a9e9e1f75e12694c58059c +size 188088320 diff --git a/params_shard_429.bin b/params_shard_429.bin new file mode 100644 index 0000000000000000000000000000000000000000..47670ab3016813c30a6d699d99c208a577eb236f --- /dev/null +++ b/params_shard_429.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0093ccc1fcd5083411a4c8cd3d20c9a5de8d70769d594d1bbb1303c5a206278 +size 23511040 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..b582b54d1782ec1fba6b748fbbd5a151cc5a03de --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33b7ca2b17bd0500a0fd8bc98a474f4381c67e92ab0f6da87fec96fc240e9d95 +size 31068160 diff --git a/params_shard_430.bin b/params_shard_430.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a2dba589c874a64c167bbdef9e19fce9cdfedf1 --- /dev/null +++ b/params_shard_430.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b17329a5e4e1f5df8ad56e2f6ad7ec52e7904c76ef2a7c561c93096cabb77af +size 33587200 diff --git a/params_shard_431.bin b/params_shard_431.bin new file mode 100644 index 0000000000000000000000000000000000000000..b04814bc46d0ae1ccbab2ba6b46bff1d6a599249 --- /dev/null +++ b/params_shard_431.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a63c9680c37262749e641ec14b2239d927723eeede6113487f072949031c419 +size 26869760 diff --git a/params_shard_432.bin b/params_shard_432.bin new file mode 100644 index 0000000000000000000000000000000000000000..575e593e0c6e8afd2624ba150202511268f819ee --- /dev/null +++ b/params_shard_432.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:140b453f830e54048661c6122a6c965de8792f83f44d5a705499af06ac84b9f8 +size 93978624 diff --git a/params_shard_433.bin b/params_shard_433.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf4a5b8a4395c7a8c92a9df933d94e06ac422ce5 --- /dev/null +++ b/params_shard_433.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5913d6369efeff671c11eebeec75fa5be130098426284abe6c5afa1148ba352f +size 31117312 diff --git a/params_shard_434.bin b/params_shard_434.bin new file mode 100644 index 0000000000000000000000000000000000000000..a7fe2fbf4d74d963e26c6ddf1ec5168810788784 --- /dev/null +++ b/params_shard_434.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb1122442ea35b1e1e6eb9eee5b975980d31a29e29dc3841aa60d0c3e5e1f9e +size 188088320 diff --git a/params_shard_435.bin b/params_shard_435.bin new file mode 100644 index 0000000000000000000000000000000000000000..86f932f018a6e15053b8488e5b00f396f68f80ad --- /dev/null +++ b/params_shard_435.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8c6fd52eb324b7d8646b6c589761f82c5955959090b94a16c84b953c5146db7 +size 23511040 diff --git a/params_shard_436.bin b/params_shard_436.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2e5ec7c9497026e5daeeb0c0ece085c6d737e22 --- /dev/null +++ b/params_shard_436.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a114e27fdc9efae753b2f51d3daeaab4b0cb33def4dfabed85e1d22cdd13b7 +size 33587200 diff --git a/params_shard_437.bin b/params_shard_437.bin new file mode 100644 index 0000000000000000000000000000000000000000..256150b07db9cc0e9da9c6dfd1d83d8e42844926 --- /dev/null +++ b/params_shard_437.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3da957006d6ccc912b204bbed89b7f9567053507b6663666c2b0620c8b640abf +size 26869760 diff --git a/params_shard_438.bin b/params_shard_438.bin new file mode 100644 index 0000000000000000000000000000000000000000..23ee011e49fec65b94a1067d6cdf989368c68ae1 --- /dev/null +++ b/params_shard_438.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdeae27a559bf3fce821fc34a7b03a7ee03383dbf26926cc791686a5274dc2ff +size 33587200 diff --git a/params_shard_439.bin b/params_shard_439.bin new file mode 100644 index 0000000000000000000000000000000000000000..7b627872a7a7e1f965b26019c102a805284149fd --- /dev/null +++ b/params_shard_439.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f45704f28ce207d96032ab822c7f150f92595eb31a9fda7d35922900488b0bea +size 93978624 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..282eca3286754ed66e0e98084c69f7a0b1e68248 --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1079cf6bb3dd3ee56d422a3101fd1f8df67a026719e157ce1a8c1b4ae66648a +size 93978624 diff --git a/params_shard_440.bin b/params_shard_440.bin new file mode 100644 index 0000000000000000000000000000000000000000..379a2a544ace1ab91c653c3a77d6266844fbcda9 --- /dev/null +++ b/params_shard_440.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:518c37f8fe377f98edeabb7e1d9bd9466eff8fd704fb5bbc4cc8db94a9a0c554 +size 23535616 diff --git a/params_shard_441.bin b/params_shard_441.bin new file mode 100644 index 0000000000000000000000000000000000000000..fd810cd3b667971bedbb542b104ec1cdd4affb00 --- /dev/null +++ b/params_shard_441.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd34eb6855922546a37476ad21b9569b412e1b7db60f89d20776217cd5c283b0 +size 188088320 diff --git a/params_shard_442.bin b/params_shard_442.bin new file mode 100644 index 0000000000000000000000000000000000000000..484a3163b23bcf8223175bdc4d56c03391b19c08 --- /dev/null +++ b/params_shard_442.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c93c3789517f2fc582f28ec536b3f7ccf6e05253389e1a4df94c46535b87bc6c +size 23511040 diff --git a/params_shard_443.bin b/params_shard_443.bin new file mode 100644 index 0000000000000000000000000000000000000000..301afab6cb03038421202048030e6f258b211810 --- /dev/null +++ b/params_shard_443.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd1a654e3220f40921b49d9ca525270eed7d803e6eb39af56a00a21e1e134cb9 +size 26869760 diff --git a/params_shard_444.bin b/params_shard_444.bin new file mode 100644 index 0000000000000000000000000000000000000000..7f93e6ddc7cb33108690410f7098ee32d1c9c11a --- /dev/null +++ b/params_shard_444.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:983bbd83861f9121ebeb2b42813ed66845599f335e5e158710cd20371936b317 +size 93978624 diff --git a/params_shard_445.bin b/params_shard_445.bin new file mode 100644 index 0000000000000000000000000000000000000000..9f62f312a4c23f2d7a992cfc9ee50e089bed40f4 --- /dev/null +++ b/params_shard_445.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b83cca3de4ad568840e49b253acb09e28a10fb369f0b4d8de48450000f452cc +size 188088320 diff --git a/params_shard_446.bin b/params_shard_446.bin new file mode 100644 index 0000000000000000000000000000000000000000..b88e20acc5b3fd9109b05d6850c7cadc2d2017cc --- /dev/null +++ b/params_shard_446.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ddb70be918cf49ac1709fcf8e5c7bb09911ea024aee02e1d4a6d8bc1082b65 +size 23511040 diff --git a/params_shard_447.bin b/params_shard_447.bin new file mode 100644 index 0000000000000000000000000000000000000000..5493ca278054e82653586efdc8267d710c3ebe2d --- /dev/null +++ b/params_shard_447.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80a3759488ec2ba86b64dc6c56b94127fdcf444c449549d4c73a8fba6dbdd64 +size 33587200 diff --git a/params_shard_448.bin b/params_shard_448.bin new file mode 100644 index 0000000000000000000000000000000000000000..1f19c383e373ab90fc93d79175e666f3acacec84 --- /dev/null +++ b/params_shard_448.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f973edf27c29720841b98929bd216498adae657328a51fd37df15adaffacbc50 +size 26869760 diff --git a/params_shard_449.bin b/params_shard_449.bin new file mode 100644 index 0000000000000000000000000000000000000000..d00362fee0e60124765d6572651f03ef868b111d --- /dev/null +++ b/params_shard_449.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dc0904483c9e39f3e4245a3975fbce7023d8057f2dd84124d01686b1f55773e +size 31100928 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0e1a4bf4c97fdfd677998e4dd8b7b93b9a99a2a --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18168fcb274078a5cb8f5098b4e0ede50d1fedd280f8c3a61a7a3cb2b0dec598 +size 93978624 diff --git a/params_shard_450.bin b/params_shard_450.bin new file mode 100644 index 0000000000000000000000000000000000000000..5e5742b3771dda5705c9665ce3049693c4738813 --- /dev/null +++ b/params_shard_450.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7628555c85f828fd6779d9552ae57da31272adf1bb60c1227090dc40e7feccf8 +size 93978624 diff --git a/params_shard_451.bin b/params_shard_451.bin new file mode 100644 index 0000000000000000000000000000000000000000..95d649ecfdaa9c2809a0a22fe599bd0eea454ec8 --- /dev/null +++ b/params_shard_451.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fcfafcf316e9203709d77e242a214a62f91f79d9310a7f08ba5fbba69a123ae +size 188088320 diff --git a/params_shard_452.bin b/params_shard_452.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7fda86bccf56293aa279a418410a52715f2a5d0 --- /dev/null +++ b/params_shard_452.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7aed1ee58b07acf1baa3f53dd6f17f33f79db253cc0aa89ad4aa82f5209e8b9 +size 23511040 diff --git a/params_shard_453.bin b/params_shard_453.bin new file mode 100644 index 0000000000000000000000000000000000000000..2137fb7743925b3dc658706d29d68a9093a69d1f --- /dev/null +++ b/params_shard_453.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b9a433d66191068f7a577a56d172ab4c8c8ca8d5a3ef6f203ae3d76a076d9d5 +size 33587200 diff --git a/params_shard_454.bin b/params_shard_454.bin new file mode 100644 index 0000000000000000000000000000000000000000..c2848fa853fb73f51822ba6037041e75716e3477 --- /dev/null +++ b/params_shard_454.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbd51795f9f51755f9ee518e88030e337485bebdc42b2c73dcabfe74fede12b4 +size 26869760 diff --git a/params_shard_455.bin b/params_shard_455.bin new file mode 100644 index 0000000000000000000000000000000000000000..a519a3f3ce8b49558c1ea7ae0198e103559114df --- /dev/null +++ b/params_shard_455.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac2f042b2e6ad679ce3df03b0f05527909b0dc12c35e650788dbacf4fccd1672 +size 22712320 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..e37d77c660abf91d5b2ea4d2e4996d68d7bbeb9d --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a22c2113cbddf96d75bcce18832baf9e3eaf25af5ec2b58636f6ac605c487f3a +size 188088320 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..6cc82711e520b34eafaceed065578d40256ddca0 --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff85f7fd1c507cfc5f0b758e1a4c3506688faae06599c00b4a6b405526d727e6 +size 23511040 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..084fcd3f9779f07cd523f8b80e6b60431a90b862 --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83b447a9d1ed92be1c8258fdb9862a4786e7643ce0efc608343239d78087fc92 +size 33587200 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..72af9ac0e1958a6c59f723256eeaed07c13fb1aa --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fca782d29b5caae1f20dbcf7752badaeb2fad09d724a92ccbbb327ff63a42675 +size 26869760 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..323838392692c185882b60f3484490d942fafbd7 --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5de17f1f0aa3d5d91d8b7b54c5976bbf30029ab6b0f6bc1dfe9599669d7a4361 +size 188088320 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..263f555a04ebc5c4487b5b765dd3bcd06033e4f0 --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:857267bbc5c377720c9cf09ab785bbacad4157f4df6b411e4c03d9278308dedd +size 31117312 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..8f3f58923628e7ce99293d186e3c66bf6ef54ff6 --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65ab30fed9e32f750d44c51849655bbca3b60f044afa6e255dbe12b3d5540e64 +size 93978624 diff --git a/params_shard_52.bin b/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7307a312ba7602ab79ac0595eec14f9e8c943bf --- /dev/null +++ b/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a068fdb7a1e8a4fee6c73d6504607b28af91f0c1a97731bc3b0e3d1850691fec +size 188088320 diff --git a/params_shard_53.bin b/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..239523f9e66fc303dfff7879805b1bc633d2c6ab --- /dev/null +++ b/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61904df137929e4f42253d27d23c3e9182188ae4d642f4898925b09c48ff40dd +size 23511040 diff --git a/params_shard_54.bin b/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..1884f5962515703ea04c290812b9ada1bdcbdd4d --- /dev/null +++ b/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6e0f8c54012e30a3060bfa82f0410ce21b50bc0e331b68abacfe162ca12477a +size 33587200 diff --git a/params_shard_55.bin b/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..759017659e8977f416e9af9b71380d2f0bcf1307 --- /dev/null +++ b/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a9279487ac1ed0c94d3b4307c96d4598187d290661f23009339e4742a312255 +size 26869760 diff --git a/params_shard_56.bin b/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..3e775bb2094a3c857fb54dc18d1e84dc5b08bbd0 --- /dev/null +++ b/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c4c3395ba4efc16dd5c72baf7d1c20228cb5559f5ea6cb921f4b86c8e77cff +size 188088320 diff --git a/params_shard_57.bin b/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..a3814f8d495831f546daaf92319594986418d6bb --- /dev/null +++ b/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e51829c1a2607483bb94c5d0d7876067a1a7f7ab279a164e8cf93229ed698b48 +size 23511040 diff --git a/params_shard_58.bin b/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..f1f238793515d01035c20db345fb8b2efb5265c9 --- /dev/null +++ b/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:138b1ab65854bcff595a5aa9376605146422e1838283e3588db65297178a408c +size 33587200 diff --git a/params_shard_59.bin b/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..c2f425684868f621113754956c5e118f1d3cb004 --- /dev/null +++ b/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad4b18d1561030119eff6b6a900b09c8ab3231a3e47fee2f42eea2c02849d33e +size 26869760 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a72761f019f93a9e2d7204e07a9a01965d02c86 --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330c23b7e94767f00a7fdd0dead1d193b64a610322d51b080d6526fdea6babcf +size 23511040 diff --git a/params_shard_60.bin b/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..f84bd07d595e43119cd3ea1512f14bb16f298a8a --- /dev/null +++ b/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6ecd4734cb0abcdb0a1de0683ee321bbccea01d450308ae6145ebc6f99ca58 +size 93978624 diff --git a/params_shard_61.bin b/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..f522c3c50cabc63852ee7f1cbb13d708c5f0a9d2 --- /dev/null +++ b/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56324a82c17b3212880e01861e8f41f300b9f88c580d8d31bf6583fe722c733f +size 30269440 diff --git a/params_shard_62.bin b/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..5b8c5372097a4bd87f206968de1b900d60f45729 --- /dev/null +++ b/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:948a6eb2a8fa3a8ac8884dd337711293b9208cdace08f2e3d3aa4abe1f26a227 +size 93978624 diff --git a/params_shard_63.bin b/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3b7880c23eadb069a52fed9c1bd976abd1999da --- /dev/null +++ b/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97ff5911a4315d509948a72541d412d7ebc370e49d0649a360ee4bd98779b978 +size 188088320 diff --git a/params_shard_64.bin b/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c9e6e6472a0de4616dd5ed7466c5b512400cea6 --- /dev/null +++ b/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1f94210090fb145acc628a2de05473b10a6c835101b6558a9b61ab1e194a27 +size 23511040 diff --git a/params_shard_65.bin b/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..4c010e69dde7fb9bed8ef360e63c0b02fe368818 --- /dev/null +++ b/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9d9f7617c118c6f05ebfa9c0e21dc2a243ea2b46bd4bf19f4b6842fb3f490b2 +size 33587200 diff --git a/params_shard_66.bin b/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..1791d58959c93838a0a1bc77120dcb3b69b120ba --- /dev/null +++ b/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f2b2b6fbe7a48b66f9a41226128a0f93980fd51a7223c789dd0aad299c1557 +size 26869760 diff --git a/params_shard_67.bin b/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..2516b9bceba5b5bb0e03b3938c1acd460d68f14c --- /dev/null +++ b/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963c9d3ad5663d1db018c4306e111ed32df95a228d42aea68e9e74278297bd47 +size 93978624 diff --git a/params_shard_68.bin b/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..f52facdbcb8882acf026cbdcc11807a0f278357a --- /dev/null +++ b/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a96c22a183870e9d18ca71b9d100483b08395ee281aadd46056716982bb2144 +size 31117312 diff --git a/params_shard_69.bin b/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..13b59fdf5c0514bd8dccebdf3b9377ccb948517e --- /dev/null +++ b/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95307d2e460b57770a884775d4cc1e936b94896b077d4340b581d00c485e9b17 +size 188088320 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ff6701b5da67261274fe408ea2ae3203d327784 --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402ed25a084dd1af8e9c0302f4706c90193d523a1e86cea55dfffca205a48846 +size 33587200 diff --git a/params_shard_70.bin b/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7c9185a02da488f397739d9415c2ef0dff83351 --- /dev/null +++ b/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3b5d541932631ca76284cd77a80b54830a315c2c0977a2609f6835e28a387f3 +size 23511040 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..d91bc29c6a98b57911bfd9fcfc39bf18947abbfb --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35429784b67e942e5c90965763eefc3fc03e752be2ad64904623f956b22477ca +size 33587200 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..25558f07fa348d765b829062de7f5d45fb1a5f26 --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6faa2d21400bdef31f3cdc4415d45c33dedd49cf24f413798e6375ac4a9c808 +size 26869760 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0c996a9d499cdbfd66609ee1fb98acce300e1f6 --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c99d19cdc0bf7804b7eb7fb56577c92fc597142893d2069c15caf7e388d41c46 +size 33587200 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..210e940b7d7de6ab10227d0d065a69e3314013bb --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6b40a83984154b219255780b85638059d68f93d1cc4dec76474dd04ed9f0af0 +size 26869760 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..8111b626aac5742d650bdad974a37d5954680f1f --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e091b8f97539b6839a86b7b3b947f8d3aa3493604cfc388a5624c157e06fe544 +size 93978624 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..0d250d3b5d819fe959e6e0f1cdbad08dd096fe35 --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:053bbd156d4b3e3b140e26cdb231d6cb88016a186984b274b9d495c939324ec3 +size 26894336 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..59c0edb5ba1c335900e19b11f2afd8cdfd2b8ae4 --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c8ac482310ad9448b30dde42516b1d824516d7af620d3550380ea010a8dcb08 +size 188088320 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..eada5980542cddde91255e4374f2407dd8105c1b --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9e4e81c7e3ba6d9a53f5ef08675ed2f45bd6ab9c35f55e72d07880f3d7d2693 +size 23511040 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..f9151d5809b5b78591673ac8df5ea344b26d7efa --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac7acae407f610c31ae445391293f4d07cc50ac6d42bfb8f59c946029fade84f +size 93978624 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..9989aec9b7acf038326152b6313bc52d76125828 --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a539ae04c5ef4bbd1f5b96380985b9da0ec10de324a1a0c12007251d81c2a340 +size 26869760 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..7745f3fd8582464daf9de6e6fbee8076adae768c --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c1159d311da950bb773584293d3a1b80e80f911caf4cccd9c6eb30545e1c03b +size 188088320 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..6dd50aee573d673d27eb979e32d14ff80735f2aa --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce4b4c575e77b162777b5e17cafbda30079809fe0e205b6d5df46566ba195c1e +size 23511040 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..5ad3b9698f5257ee76c2b9a6e3813964e1b7b476 --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9325c9f4006ae547b54f3e6300a872897db44748a881822aa63f935826b283ba +size 33587200 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..77d2169d3f78285913c73cac27ad3355e55dd515 --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33163e20bf7ce7b1d16b551fc93759eb1da74229426a4bde5362216bfc8be691 +size 26869760 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..c949ed03c2c202a65037347cb4a004e19d361b39 --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0473233dbb7d22b8e96599e4af5277c217511b6fe0bd7c61763d395fe861161e +size 93978624 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..02c220da569fd33e9cbe52e4adf098687771bc5c --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea9e573810399b90fb4ca1be7522ff88d92cbd8b1c5831d5c98a10cf0c783bba +size 31117312 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..7272513ee39c85903d242180a4c096e0f9c1e37f --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124c34ba53a1de96ba90260f30d8280f9cec8c5af9dc27fd97a6566f09d042df +size 188088320 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..d8c02a28cec13bbaa98014af4a246c001666df26 --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5920d2b1e9b53d107029a9fb34583320351f0a008998253c818fdb639e900764 +size 23511040 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..baa88412b1736618eba82bfa69689ff787ec2893 --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf8c1594c1578b9e543e6d1b326703453bde6a50308f472f2a18ab3708a15a5 +size 33587200 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..b0dd101e9789659991b998abe4f573d1bda21f1a --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5e6f09e7c2a3d90b6beb3b2a4f8c95b4b78c72f0b2ff5f7e17255603edafc9e +size 26869760 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..923d523e1adb600548914267b9e72a9fc7f5cede --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:100133fcc2fdf24066e609fd9080db22e09c7fe6169d6db0b8232973eca5af8e +size 188088320 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..623616fe9955d385154c13c76fdcf2fc9864e2d0 --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3dc187c43b71410570a031f749af3dbf7c0155a24d9daf49713d8748d79626 +size 33587200 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..ff787dfa5a69c6c9dfab8bc20f1133f37fbb6c60 --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e7b2c04b0515fd17ac94fa4ca3e6cb352f8cd0bf948026dc8622587ad7107a +size 93978624 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..d169b8a8b4f2a482af71ca7d15553636de07208e --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be8c4c56c2ad7ea92d1f8654727663e9a8dfd51cb65872a1da4a6e923fb7b12f +size 23535616 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..c62cc8b64083fa7c0de3fae75146612f7ab49a87 --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:905f07f7af307cf496f6008fbc2c93af41b0c6e361120a8abe9b2b0f7eecf109 +size 188088320 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..701de3036ea617fa27b9bb11fe0a0c420fce1a99 --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ee88e870e330d9f1a2676f4596f1ff969cda133516df2b6d0e803e15f8af602 +size 23511040 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..a2082bd32a2d1202cb1075b1926f77fd344e0c87 --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bb585110e524178d7767835dcf7b7000fd0f2ec0c3e6b3fa264c85f22fa36fc +size 26869760 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..d8c96a8a567cb8534de2000a359598f509ac3556 --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddcd4900baadce1d0703163f9e9010baab2bab9d2e6121ee81eeaf50bdc2ce2e +size 93978624 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..4bfa5fb629f0cfa34bc45a3adf862d8830040204 --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a03092e627f5d6a538809dbc6635e9b08a4ab08b89c269cd5bf5a350ce86f6b2 +size 188088320 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..52e49d1dc24f13b9d8a2ccb111ed6cb7dd64e5e2 --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af1d02df52cc288838adc673df9ae924f59ad7abf94d6270aa8e502b7bb71875 +size 23511040 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..f3077c3bbe24e58678f2bf7ff606fbc5a0f264b4 --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae67b8ddaa2a34ce659b18e163fe0fba2ba3b1b7cfef43560f85a65fb1370026 +size 33587200 diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..5c903c017d75658b8abbbf5a4b0ad1d5bb595d55 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,410503 @@ +{ + "version": "1.0", + "truncation": null, + "padding": null, + "added_tokens": [ + { + "id": 128000, + "content": "<|begin_of_text|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128001, + "content": "<|end_of_text|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128002, + "content": "<|reserved_special_token_0|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128003, + "content": "<|reserved_special_token_1|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128004, + "content": "<|reserved_special_token_2|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128005, + "content": "<|reserved_special_token_3|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128006, + "content": "<|start_header_id|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128007, + "content": "<|end_header_id|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128008, + "content": "<|reserved_special_token_4|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128009, + "content": "<|eot_id|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128010, + "content": "<|reserved_special_token_5|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128011, + "content": "<|reserved_special_token_6|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128012, + "content": "<|reserved_special_token_7|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128013, + "content": "<|reserved_special_token_8|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128014, + "content": "<|reserved_special_token_9|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128015, + "content": "<|reserved_special_token_10|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128016, + "content": "<|reserved_special_token_11|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128017, + "content": "<|reserved_special_token_12|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128018, + "content": "<|reserved_special_token_13|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128019, + "content": "<|reserved_special_token_14|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128020, + "content": "<|reserved_special_token_15|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128021, + "content": "<|reserved_special_token_16|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128022, + "content": "<|reserved_special_token_17|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128023, + "content": "<|reserved_special_token_18|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128024, + "content": "<|reserved_special_token_19|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128025, + "content": "<|reserved_special_token_20|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128026, + "content": "<|reserved_special_token_21|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128027, + "content": "<|reserved_special_token_22|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128028, + "content": "<|reserved_special_token_23|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128029, + "content": "<|reserved_special_token_24|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128030, + "content": "<|reserved_special_token_25|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128031, + "content": "<|reserved_special_token_26|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128032, + "content": "<|reserved_special_token_27|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128033, + "content": "<|reserved_special_token_28|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128034, + "content": "<|reserved_special_token_29|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128035, + "content": "<|reserved_special_token_30|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128036, + "content": "<|reserved_special_token_31|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128037, + "content": "<|reserved_special_token_32|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128038, + "content": "<|reserved_special_token_33|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128039, + "content": "<|reserved_special_token_34|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128040, + "content": "<|reserved_special_token_35|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128041, + "content": "<|reserved_special_token_36|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128042, + "content": "<|reserved_special_token_37|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128043, + "content": "<|reserved_special_token_38|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128044, + "content": "<|reserved_special_token_39|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128045, + "content": "<|reserved_special_token_40|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128046, + "content": "<|reserved_special_token_41|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128047, + "content": "<|reserved_special_token_42|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128048, + "content": "<|reserved_special_token_43|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128049, + "content": "<|reserved_special_token_44|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128050, + "content": "<|reserved_special_token_45|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128051, + "content": "<|reserved_special_token_46|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128052, + "content": "<|reserved_special_token_47|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128053, + "content": "<|reserved_special_token_48|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128054, + "content": "<|reserved_special_token_49|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128055, + "content": "<|reserved_special_token_50|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128056, + "content": "<|reserved_special_token_51|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128057, + "content": "<|reserved_special_token_52|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128058, + "content": "<|reserved_special_token_53|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128059, + "content": "<|reserved_special_token_54|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128060, + "content": "<|reserved_special_token_55|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128061, + "content": "<|reserved_special_token_56|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128062, + "content": "<|reserved_special_token_57|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128063, + "content": "<|reserved_special_token_58|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128064, + "content": "<|reserved_special_token_59|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128065, + "content": "<|reserved_special_token_60|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128066, + "content": "<|reserved_special_token_61|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128067, + "content": "<|reserved_special_token_62|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128068, + "content": "<|reserved_special_token_63|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128069, + "content": "<|reserved_special_token_64|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128070, + "content": "<|reserved_special_token_65|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128071, + "content": "<|reserved_special_token_66|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128072, + "content": "<|reserved_special_token_67|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128073, + "content": "<|reserved_special_token_68|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128074, + "content": "<|reserved_special_token_69|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128075, + "content": "<|reserved_special_token_70|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128076, + "content": "<|reserved_special_token_71|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128077, + "content": "<|reserved_special_token_72|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128078, + "content": "<|reserved_special_token_73|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128079, + "content": "<|reserved_special_token_74|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128080, + "content": "<|reserved_special_token_75|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128081, + "content": "<|reserved_special_token_76|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128082, + "content": "<|reserved_special_token_77|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128083, + "content": "<|reserved_special_token_78|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128084, + "content": "<|reserved_special_token_79|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128085, + "content": "<|reserved_special_token_80|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128086, + "content": "<|reserved_special_token_81|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128087, + "content": "<|reserved_special_token_82|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128088, + "content": "<|reserved_special_token_83|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128089, + "content": "<|reserved_special_token_84|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128090, + "content": "<|reserved_special_token_85|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128091, + "content": "<|reserved_special_token_86|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128092, + "content": "<|reserved_special_token_87|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128093, + "content": "<|reserved_special_token_88|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128094, + "content": "<|reserved_special_token_89|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128095, + "content": "<|reserved_special_token_90|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128096, + "content": "<|reserved_special_token_91|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128097, + "content": "<|reserved_special_token_92|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128098, + "content": "<|reserved_special_token_93|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128099, + "content": "<|reserved_special_token_94|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128100, + "content": "<|reserved_special_token_95|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128101, + "content": "<|reserved_special_token_96|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128102, + "content": "<|reserved_special_token_97|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128103, + "content": "<|reserved_special_token_98|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128104, + "content": "<|reserved_special_token_99|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128105, + "content": "<|reserved_special_token_100|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128106, + "content": "<|reserved_special_token_101|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128107, + "content": "<|reserved_special_token_102|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128108, + "content": "<|reserved_special_token_103|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128109, + "content": "<|reserved_special_token_104|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128110, + "content": "<|reserved_special_token_105|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128111, + "content": "<|reserved_special_token_106|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128112, + "content": "<|reserved_special_token_107|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128113, + "content": "<|reserved_special_token_108|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128114, + "content": "<|reserved_special_token_109|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128115, + "content": "<|reserved_special_token_110|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128116, + "content": "<|reserved_special_token_111|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128117, + "content": "<|reserved_special_token_112|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128118, + "content": "<|reserved_special_token_113|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128119, + "content": "<|reserved_special_token_114|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128120, + "content": "<|reserved_special_token_115|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128121, + "content": "<|reserved_special_token_116|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128122, + "content": "<|reserved_special_token_117|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128123, + "content": "<|reserved_special_token_118|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128124, + "content": "<|reserved_special_token_119|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128125, + "content": "<|reserved_special_token_120|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128126, + "content": "<|reserved_special_token_121|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128127, + "content": "<|reserved_special_token_122|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128128, + "content": "<|reserved_special_token_123|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128129, + "content": "<|reserved_special_token_124|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128130, + "content": "<|reserved_special_token_125|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128131, + "content": "<|reserved_special_token_126|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128132, + "content": "<|reserved_special_token_127|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128133, + "content": "<|reserved_special_token_128|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128134, + "content": "<|reserved_special_token_129|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128135, + "content": "<|reserved_special_token_130|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128136, + "content": "<|reserved_special_token_131|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128137, + "content": "<|reserved_special_token_132|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128138, + "content": "<|reserved_special_token_133|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128139, + "content": "<|reserved_special_token_134|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128140, + "content": "<|reserved_special_token_135|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128141, + "content": "<|reserved_special_token_136|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128142, + "content": "<|reserved_special_token_137|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128143, + "content": "<|reserved_special_token_138|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128144, + "content": "<|reserved_special_token_139|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128145, + "content": "<|reserved_special_token_140|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128146, + "content": "<|reserved_special_token_141|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128147, + "content": "<|reserved_special_token_142|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128148, + "content": "<|reserved_special_token_143|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128149, + "content": "<|reserved_special_token_144|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128150, + "content": "<|reserved_special_token_145|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128151, + "content": "<|reserved_special_token_146|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128152, + "content": "<|reserved_special_token_147|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128153, + "content": "<|reserved_special_token_148|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128154, + "content": "<|reserved_special_token_149|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128155, + "content": "<|reserved_special_token_150|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128156, + "content": "<|reserved_special_token_151|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128157, + "content": "<|reserved_special_token_152|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128158, + "content": "<|reserved_special_token_153|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128159, + "content": "<|reserved_special_token_154|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128160, + "content": "<|reserved_special_token_155|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128161, + "content": "<|reserved_special_token_156|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128162, + "content": "<|reserved_special_token_157|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128163, + "content": "<|reserved_special_token_158|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128164, + "content": "<|reserved_special_token_159|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128165, + "content": "<|reserved_special_token_160|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128166, + "content": "<|reserved_special_token_161|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128167, + "content": "<|reserved_special_token_162|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128168, + "content": "<|reserved_special_token_163|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128169, + "content": "<|reserved_special_token_164|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128170, + "content": "<|reserved_special_token_165|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128171, + "content": "<|reserved_special_token_166|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128172, + "content": "<|reserved_special_token_167|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128173, + "content": "<|reserved_special_token_168|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128174, + "content": "<|reserved_special_token_169|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128175, + "content": "<|reserved_special_token_170|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128176, + "content": "<|reserved_special_token_171|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128177, + "content": "<|reserved_special_token_172|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128178, + "content": "<|reserved_special_token_173|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128179, + "content": "<|reserved_special_token_174|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128180, + "content": "<|reserved_special_token_175|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128181, + "content": "<|reserved_special_token_176|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128182, + "content": "<|reserved_special_token_177|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128183, + "content": "<|reserved_special_token_178|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128184, + "content": "<|reserved_special_token_179|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128185, + "content": "<|reserved_special_token_180|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128186, + "content": "<|reserved_special_token_181|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128187, + "content": "<|reserved_special_token_182|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128188, + "content": "<|reserved_special_token_183|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128189, + "content": "<|reserved_special_token_184|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128190, + "content": "<|reserved_special_token_185|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128191, + "content": "<|reserved_special_token_186|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128192, + "content": "<|reserved_special_token_187|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128193, + "content": "<|reserved_special_token_188|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128194, + "content": "<|reserved_special_token_189|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128195, + "content": "<|reserved_special_token_190|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128196, + "content": "<|reserved_special_token_191|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128197, + "content": "<|reserved_special_token_192|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128198, + "content": "<|reserved_special_token_193|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128199, + "content": "<|reserved_special_token_194|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128200, + "content": "<|reserved_special_token_195|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128201, + "content": "<|reserved_special_token_196|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128202, + "content": "<|reserved_special_token_197|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128203, + "content": "<|reserved_special_token_198|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128204, + "content": "<|reserved_special_token_199|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128205, + "content": "<|reserved_special_token_200|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128206, + "content": "<|reserved_special_token_201|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128207, + "content": "<|reserved_special_token_202|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128208, + "content": "<|reserved_special_token_203|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128209, + "content": "<|reserved_special_token_204|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128210, + "content": "<|reserved_special_token_205|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128211, + "content": "<|reserved_special_token_206|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128212, + "content": "<|reserved_special_token_207|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128213, + "content": "<|reserved_special_token_208|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128214, + "content": "<|reserved_special_token_209|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128215, + "content": "<|reserved_special_token_210|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128216, + "content": "<|reserved_special_token_211|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128217, + "content": "<|reserved_special_token_212|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128218, + "content": "<|reserved_special_token_213|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128219, + "content": "<|reserved_special_token_214|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128220, + "content": "<|reserved_special_token_215|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128221, + "content": "<|reserved_special_token_216|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128222, + "content": "<|reserved_special_token_217|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128223, + "content": "<|reserved_special_token_218|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128224, + "content": "<|reserved_special_token_219|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128225, + "content": "<|reserved_special_token_220|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128226, + "content": "<|reserved_special_token_221|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128227, + "content": "<|reserved_special_token_222|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128228, + "content": "<|reserved_special_token_223|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128229, + "content": "<|reserved_special_token_224|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128230, + "content": "<|reserved_special_token_225|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128231, + "content": "<|reserved_special_token_226|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128232, + "content": "<|reserved_special_token_227|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128233, + "content": "<|reserved_special_token_228|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128234, + "content": "<|reserved_special_token_229|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128235, + "content": "<|reserved_special_token_230|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128236, + "content": "<|reserved_special_token_231|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128237, + "content": "<|reserved_special_token_232|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128238, + "content": "<|reserved_special_token_233|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128239, + "content": "<|reserved_special_token_234|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128240, + "content": "<|reserved_special_token_235|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128241, + "content": "<|reserved_special_token_236|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128242, + "content": "<|reserved_special_token_237|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128243, + "content": "<|reserved_special_token_238|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128244, + "content": "<|reserved_special_token_239|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128245, + "content": "<|reserved_special_token_240|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128246, + "content": "<|reserved_special_token_241|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128247, + "content": "<|reserved_special_token_242|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128248, + "content": "<|reserved_special_token_243|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128249, + "content": "<|reserved_special_token_244|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128250, + "content": "<|reserved_special_token_245|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128251, + "content": "<|reserved_special_token_246|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128252, + "content": "<|reserved_special_token_247|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128253, + "content": "<|reserved_special_token_248|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128254, + "content": "<|reserved_special_token_249|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128255, + "content": "<|reserved_special_token_250|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + } + ], + "normalizer": null, + "pre_tokenizer": { + "type": "Sequence", + "pretokenizers": [ + { + "type": "Split", + "pattern": { + "Regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?\\p{L}+|\\p{N}{1,3}| ?[^\\s\\p{L}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+" + }, + "behavior": "Isolated", + "invert": false + }, + { + "type": "ByteLevel", + "add_prefix_space": false, + "trim_offsets": true, + "use_regex": false + } + ] + }, + "post_processor": { + "type": "ByteLevel", + "add_prefix_space": true, + "trim_offsets": false, + "use_regex": true + }, + "decoder": { + "type": "ByteLevel", + "add_prefix_space": true, + "trim_offsets": true, + "use_regex": true + }, + "model": { + "type": "BPE", + "dropout": null, + "unk_token": null, + "continuing_subword_prefix": null, + "end_of_word_suffix": null, + "fuse_unk": false, + "byte_fallback": false, + "vocab": { + "!": 0, + "\"": 1, + "#": 2, + "$": 3, + "%": 4, + "&": 5, + "'": 6, + "(": 7, + ")": 8, + "*": 9, + "+": 10, + ",": 11, + "-": 12, + ".": 13, + "/": 14, + "0": 15, + "1": 16, + "2": 17, + "3": 18, + "4": 19, + "5": 20, + "6": 21, + "7": 22, + "8": 23, + "9": 24, + ":": 25, + ";": 26, + "<": 27, + "=": 28, + ">": 29, + "?": 30, + "@": 31, + "A": 32, + "B": 33, + "C": 34, + "D": 35, + "E": 36, + "F": 37, + "G": 38, + "H": 39, + "I": 40, + "J": 41, + "K": 42, + "L": 43, + "M": 44, + "N": 45, + "O": 46, + "P": 47, + "Q": 48, + "R": 49, + "S": 50, + "T": 51, + "U": 52, + "V": 53, + "W": 54, + "X": 55, + "Y": 56, + "Z": 57, + "[": 58, + "\\": 59, + "]": 60, + "^": 61, + "_": 62, + "`": 63, + "a": 64, + "b": 65, + "c": 66, + "d": 67, + "e": 68, + "f": 69, + "g": 70, + "h": 71, + "i": 72, + "j": 73, + "k": 74, + "l": 75, + "m": 76, + "n": 77, + "o": 78, + "p": 79, + "q": 80, + "r": 81, + "s": 82, + "t": 83, + "u": 84, + "v": 85, + "w": 86, + "x": 87, + "y": 88, + "z": 89, + "{": 90, + "|": 91, + "}": 92, + "~": 93, + "¡": 94, + "¢": 95, + "£": 96, + "¤": 97, + "¥": 98, + "¦": 99, + "§": 100, + "¨": 101, + "©": 102, + "ª": 103, + "«": 104, + "¬": 105, + "®": 106, + "¯": 107, + "°": 108, + "±": 109, + "²": 110, + "³": 111, + "´": 112, + "µ": 113, + "¶": 114, + "·": 115, + "¸": 116, + "¹": 117, + "º": 118, + "»": 119, + "¼": 120, + "½": 121, + "¾": 122, + "¿": 123, + "À": 124, + "Á": 125, + "Â": 126, + "Ã": 127, + "Ä": 128, + "Å": 129, + "Æ": 130, + "Ç": 131, + "È": 132, + "É": 133, + "Ê": 134, + "Ë": 135, + "Ì": 136, + "Í": 137, + "Î": 138, + "Ï": 139, + "Ð": 140, + "Ñ": 141, + "Ò": 142, + "Ó": 143, + "Ô": 144, + "Õ": 145, + "Ö": 146, + "×": 147, + "Ø": 148, + "Ù": 149, + "Ú": 150, + "Û": 151, + "Ü": 152, + "Ý": 153, + "Þ": 154, + "ß": 155, + "à": 156, + "á": 157, + "â": 158, + "ã": 159, + "ä": 160, + "å": 161, + "æ": 162, + "ç": 163, + "è": 164, + "é": 165, + "ê": 166, + "ë": 167, + "ì": 168, + "í": 169, + "î": 170, + "ï": 171, + "ð": 172, + "ñ": 173, + "ò": 174, + "ó": 175, + "ô": 176, + "õ": 177, + "ö": 178, + "÷": 179, + "ø": 180, + "ù": 181, + "ú": 182, + "û": 183, + "ü": 184, + "ý": 185, + "þ": 186, + "ÿ": 187, + "Ā": 188, + "ā": 189, + "Ă": 190, + "ă": 191, + "Ą": 192, + "ą": 193, + "Ć": 194, + "ć": 195, + "Ĉ": 196, + "ĉ": 197, + "Ċ": 198, + "ċ": 199, + "Č": 200, + "č": 201, + "Ď": 202, + "ď": 203, + "Đ": 204, + "đ": 205, + "Ē": 206, + "ē": 207, + "Ĕ": 208, + "ĕ": 209, + "Ė": 210, + "ė": 211, + "Ę": 212, + "ę": 213, + "Ě": 214, + "ě": 215, + "Ĝ": 216, + "ĝ": 217, + "Ğ": 218, + "ğ": 219, + "Ġ": 220, + "ġ": 221, + "Ģ": 222, + "ģ": 223, + "Ĥ": 224, + "ĥ": 225, + "Ħ": 226, + "ħ": 227, + "Ĩ": 228, + "ĩ": 229, + "Ī": 230, + "ī": 231, + "Ĭ": 232, + "ĭ": 233, + "Į": 234, + "į": 235, + "İ": 236, + "ı": 237, + "IJ": 238, + "ij": 239, + "Ĵ": 240, + "ĵ": 241, + "Ķ": 242, + "ķ": 243, + "ĸ": 244, + "Ĺ": 245, + "ĺ": 246, + "Ļ": 247, + "ļ": 248, + "Ľ": 249, + "ľ": 250, + "Ŀ": 251, + "ŀ": 252, + "Ł": 253, + "ł": 254, + "Ń": 255, + "ĠĠ": 256, + "ĠĠĠĠ": 257, + "in": 258, + "Ġt": 259, + "ĠĠĠĠĠĠĠĠ": 260, + "er": 261, + "ĠĠĠ": 262, + "on": 263, + "Ġa": 264, + "re": 265, + "at": 266, + "st": 267, + "en": 268, + "or": 269, + "Ġth": 270, + "ĊĊ": 271, + "Ġc": 272, + "le": 273, + "Ġs": 274, + "it": 275, + "an": 276, + "ar": 277, + "al": 278, + "Ġthe": 279, + ";Ċ": 280, + "Ġp": 281, + "Ġf": 282, + "ou": 283, + "Ġ=": 284, + "is": 285, + "ĠĠĠĠĠĠĠ": 286, + "ing": 287, + "es": 288, + "Ġw": 289, + "ion": 290, + "ed": 291, + "ic": 292, + "Ġb": 293, + "Ġd": 294, + "et": 295, + "Ġm": 296, + "Ġo": 297, + "ĉĉ": 298, + "ro": 299, + "as": 300, + "el": 301, + "ct": 302, + "nd": 303, + "Ġin": 304, + "Ġh": 305, + "ent": 306, + "id": 307, + "Ġn": 308, + "am": 309, + "ĠĠĠĠĠĠĠĠĠĠĠ": 310, + "Ġto": 311, + "Ġre": 312, + "--": 313, + "Ġ{": 314, + "Ġof": 315, + "om": 316, + ");Ċ": 317, + "im": 318, + "čĊ": 319, + "Ġ(": 320, + "il": 321, + "//": 322, + "Ġand": 323, + "ur": 324, + "se": 325, + "Ġl": 326, + "ex": 327, + "ĠS": 328, + "ad": 329, + "Ġ\"": 330, + "ch": 331, + "ut": 332, + "if": 333, + "**": 334, + "Ġ}": 335, + "em": 336, + "ol": 337, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 338, + "th": 339, + ")Ċ": 340, + "Ġ{Ċ": 341, + "Ġg": 342, + "ig": 343, + "iv": 344, + ",Ċ": 345, + "ce": 346, + "od": 347, + "Ġv": 348, + "ate": 349, + "ĠT": 350, + "ag": 351, + "ay": 352, + "Ġ*": 353, + "ot": 354, + "us": 355, + "ĠC": 356, + "Ġst": 357, + "ĠI": 358, + "un": 359, + "ul": 360, + "ue": 361, + "ĠA": 362, + "ow": 363, + "Ġ'": 364, + "ew": 365, + "Ġ<": 366, + "ation": 367, + "()": 368, + "Ġfor": 369, + "ab": 370, + "ort": 371, + "um": 372, + "ame": 373, + "Ġis": 374, + "pe": 375, + "tr": 376, + "ck": 377, + "âĢ": 378, + "Ġy": 379, + "ist": 380, + "----": 381, + ".ĊĊ": 382, + "he": 383, + "Ġe": 384, + "lo": 385, + "ĠM": 386, + "Ġbe": 387, + "ers": 388, + "Ġon": 389, + "Ġcon": 390, + "ap": 391, + "ub": 392, + "ĠP": 393, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 394, + "ass": 395, + "int": 396, + ">Ċ": 397, + "ly": 398, + "urn": 399, + "Ġ$": 400, + ";ĊĊ": 401, + "av": 402, + "port": 403, + "ir": 404, + "->": 405, + "nt": 406, + "ction": 407, + "end": 408, + "Ġde": 409, + "00": 410, + "ith": 411, + "out": 412, + "turn": 413, + "our": 414, + "ĠĠĠĠĠ": 415, + "lic": 416, + "res": 417, + "pt": 418, + "==": 419, + "Ġthis": 420, + "Ġwh": 421, + "Ġif": 422, + "ĠD": 423, + "ver": 424, + "age": 425, + "ĠB": 426, + "ht": 427, + "ext": 428, + "=\"": 429, + "Ġthat": 430, + "****": 431, + "ĠR": 432, + "Ġit": 433, + "ess": 434, + "ĠF": 435, + "Ġr": 436, + "os": 437, + "and": 438, + "Ġas": 439, + "ect": 440, + "ke": 441, + "rom": 442, + "Ġ//": 443, + "con": 444, + "ĠL": 445, + "(\"": 446, + "qu": 447, + "lass": 448, + "Ġwith": 449, + "iz": 450, + "de": 451, + "ĠN": 452, + "Ġal": 453, + "op": 454, + "up": 455, + "get": 456, + "Ġ}Ċ": 457, + "ile": 458, + "Ġan": 459, + "ata": 460, + "ore": 461, + "ri": 462, + "Ġpro": 463, + ";čĊ": 464, + "ĉĉĉĉ": 465, + "ter": 466, + "ain": 467, + "ĠW": 468, + "ĠE": 469, + "Ġcom": 470, + "Ġreturn": 471, + "art": 472, + "ĠH": 473, + "ack": 474, + "import": 475, + "ublic": 476, + "Ġor": 477, + "est": 478, + "ment": 479, + "ĠG": 480, + "able": 481, + "Ġ-": 482, + "ine": 483, + "ill": 484, + "ind": 485, + "ere": 486, + "::": 487, + "ity": 488, + "Ġ+": 489, + "Ġtr": 490, + "elf": 491, + "ight": 492, + "('": 493, + "orm": 494, + "ult": 495, + "str": 496, + "..": 497, + "\",": 498, + "Ġyou": 499, + "ype": 500, + "pl": 501, + "Ġnew": 502, + "Ġj": 503, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 504, + "Ġfrom": 505, + "Ġex": 506, + "ĠO": 507, + "20": 508, + "ld": 509, + "Ġ[": 510, + "oc": 511, + ":Ċ": 512, + "Ġse": 513, + "Ġle": 514, + "--------": 515, + ".s": 516, + "{Ċ": 517, + "',": 518, + "ant": 519, + "Ġat": 520, + "ase": 521, + ".c": 522, + "Ġch": 523, + "": 524, + "ave": 525, + "ang": 526, + "Ġare": 527, + "Ġint": 528, + "âĢĻ": 529, + "_t": 530, + "ert": 531, + "ial": 532, + "act": 533, + "}Ċ": 534, + "ive": 535, + "ode": 536, + "ost": 537, + "Ġclass": 538, + "Ġnot": 539, + "og": 540, + "ord": 541, + "alue": 542, + "all": 543, + "ff": 544, + "();Ċ": 545, + "ont": 546, + "ime": 547, + "are": 548, + "ĠU": 549, + "Ġpr": 550, + "Ġ:": 551, + "ies": 552, + "ize": 553, + "ure": 554, + "Ġby": 555, + "ire": 556, + "Ġ}ĊĊ": 557, + ".p": 558, + "Ġsh": 559, + "ice": 560, + "ast": 561, + "ption": 562, + "tring": 563, + "ok": 564, + "__": 565, + "cl": 566, + "##": 567, + "Ġhe": 568, + "ard": 569, + ").": 570, + "Ġ@": 571, + "iew": 572, + "ĉĉĉ": 573, + "Ġwas": 574, + "ip": 575, + "this": 576, + "Ġu": 577, + "ĠThe": 578, + "ide": 579, + "ace": 580, + "ib": 581, + "ac": 582, + "rou": 583, + "Ġwe": 584, + "ject": 585, + "Ġpublic": 586, + "ak": 587, + "ve": 588, + "ath": 589, + "oid": 590, + "Ġ=>": 591, + "ust": 592, + "que": 593, + "Ġres": 594, + "))": 595, + "'s": 596, + "Ġk": 597, + "ans": 598, + "yst": 599, + "unction": 600, + "********": 601, + "Ġi": 602, + "Ġus": 603, + "pp": 604, + "10": 605, + "one": 606, + "ail": 607, + "====": 608, + "name": 609, + "Ġstr": 610, + "Ġ/": 611, + "Ġ&": 612, + "ach": 613, + "div": 614, + "ystem": 615, + "ell": 616, + "Ġhave": 617, + "err": 618, + "ould": 619, + "ull": 620, + "pon": 621, + "ĠJ": 622, + "_p": 623, + "Ġ==": 624, + "ign": 625, + "St": 626, + ".Ċ": 627, + "Ġpl": 628, + ");ĊĊ": 629, + "form": 630, + "put": 631, + "ount": 632, + "}ĊĊ": 633, + "dd": 634, + "ite": 635, + "Ġget": 636, + "rr": 637, + "ome": 638, + "ĠâĢ": 639, + "aram": 640, + "cc": 641, + "Ġ*/": 642, + "ER": 643, + "In": 644, + "les": 645, + "_s": 646, + "ong": 647, + "ie": 648, + "Ġcan": 649, + "ĠV": 650, + "erv": 651, + "pr": 652, + "Ġun": 653, + "row": 654, + "ber": 655, + "Ġdo": 656, + "ll": 657, + "Ġel": 658, + "Ġself": 659, + "ated": 660, + "ary": 661, + "Ġ.": 662, + "']": 663, + "ud": 664, + "Ġen": 665, + "ĠTh": 666, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 667, + "te": 668, + "_c": 669, + "uct": 670, + "Ġab": 671, + "ork": 672, + ".get": 673, + "Ġ#": 674, + "aw": 675, + "ress": 676, + "ob": 677, + "Name": 678, + "201": 679, + "app": 680, + "['": 681, + "Ġall": 682, + "ory": 683, + "ition": 684, + "ance": 685, + "ear": 686, + "Ġcont": 687, + "vent": 688, + "ia": 689, + "Ġwill": 690, + "IN": 691, + "ĠĠĠĠĠĠĠĠĠ": 692, + "return": 693, + "Ġ": 694, + "data": 695, + ")ĊĊ": 696, + "Re": 697, + "ple": 698, + "ild": 699, + "ther": 700, + "Ġyour": 701, + "\"Ċ": 702, + "($": 703, + "Ġout": 704, + "),": 705, + "Ġhas": 706, + "String": 707, + "so": 708, + "Ġup": 709, + "ax": 710, + "Ġdef": 711, + "Ġbo": 712, + "ge": 713, + "alse": 714, + "ON": 715, + "per": 716, + "12": 717, + "ich": 718, + "Ġbut": 719, + "ĠĊ": 720, + "Ġ_": 721, + "_m": 722, + "add": 723, + "quest": 724, + "odel": 725, + "self": 726, + "ery": 727, + "ft": 728, + "ens": 729, + "////": 730, + "ake": 731, + ".C": 732, + "Ġgo": 733, + "Ġfunction": 734, + "ĠK": 735, + "ivate": 736, + "Ġim": 737, + "Ġconst": 738, + ".t": 739, + "Ġ*/Ċ": 740, + ");čĊ": 741, + "Ġvoid": 742, + "Ġset": 743, + "ĠSystem": 744, + "cri": 745, + "()Ċ": 746, + "li": 747, + "ĉif": 748, + ".m": 749, + "ally": 750, + "set": 751, + "ep": 752, + "âĢĻs": 753, + "bo": 754, + "def": 755, + "',Ċ": 756, + "Ġme": 757, + "Ġ!": 758, + "atch": 759, + "\">": 760, + "\",Ċ": 761, + "ec": 762, + "ĠIn": 763, + "ph": 764, + "Ġ|": 765, + "_f": 766, + "Ġvar": 767, + "ence": 768, + "Id": 769, + "ree": 770, + "ink": 771, + "lect": 772, + "ug": 773, + "eth": 774, + "Ġelse": 775, + "----------------": 776, + "19": 777, + "cont": 778, + "Ġso": 779, + "atic": 780, + "Ġlo": 781, + "pro": 782, + "ton": 783, + "ss": 784, + "own": 785, + "abel": 786, + "oint": 787, + "ous": 788, + "eld": 789, + "ST": 790, + "The": 791, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 792, + "RE": 793, + "\":": 794, + "olor": 795, + "tp": 796, + "eg": 797, + "key": 798, + "ude": 799, + "ĠSt": 800, + "ound": 801, + "Ġar": 802, + "\");Ċ": 803, + "ener": 804, + "ser": 805, + "11": 806, + "bject": 807, + "essage": 808, + "fer": 809, + "Ġmore": 810, + "ations": 811, + "ents": 812, + "Ġhis": 813, + "Ġthey": 814, + ".S": 815, + "ĠY": 816, + "use": 817, + "ne": 818, + "ish": 819, + "old": 820, + "_d": 821, + "io": 822, + "ield": 823, + "Ġper": 824, + "Cont": 825, + "ings": 826, + "####": 827, + "Ġdata": 828, + "Ġsa": 829, + "ef": 830, + "fo": 831, + "Ġone": 832, + "eng": 833, + "Ġdis": 834, + "AT": 835, + "Ġname": 836, + "Ġtrue": 837, + "val": 838, + "led": 839, + ".f": 840, + "Ġne": 841, + "Ġend": 842, + "32": 843, + ".T": 844, + "16": 845, + "cre": 846, + "ark": 847, + "log": 848, + "Ex": 849, + "error": 850, + "_id": 851, + "urre": 852, + "ange": 853, + "Ġnull": 854, + "rray": 855, + "Ġmy": 856, + "pan": 857, + "ict": 858, + "ator": 859, + "View": 860, + "List": 861, + "ĉreturn": 862, + "âĢĿ": 863, + "Ġpre": 864, + "Ġx": 865, + "clude": 866, + "arg": 867, + "15": 868, + "ov": 869, + ".h": 870, + "Ġ>": 871, + "Ġtheir": 872, + "')": 873, + "irst": 874, + "ick": 875, + "gh": 876, + "LE": 877, + "OR": 878, + "Ġprivate": 879, + "tem": 880, + "čĊčĊ": 881, + "user": 882, + "Ġ)": 883, + "com": 884, + ".A": 885, + "\";Ċ": 886, + "Ġid": 887, + "read": 888, + "Ġwho": 889, + "_b": 890, + "\">Ċ": 891, + "Ġtime": 892, + "Ġman": 893, + "ry": 894, + "========": 895, + "roup": 896, + "rop": 897, + "public": 898, + "vel": 899, + "umber": 900, + "ble": 901, + "Ġwhich": 902, + "****************": 903, + "Ġany": 904, + "Ġfalse": 905, + "we": 906, + "Ġvalue": 907, + "Ġli": 908, + "\")": 909, + "nder": 910, + "gr": 911, + "Ġno": 912, + "param": 913, + "25": 914, + "fig": 915, + ".com": 916, + "Ġapp": 917, + "_l": 918, + "ions": 919, + ".D": 920, + "ĠCh": 921, + "Ġabout": 922, + "Ġadd": 923, + "Ġsu": 924, + "Ġstring": 925, + "ID": 926, + "Ġover": 927, + "string": 928, + ".l": 929, + "ource": 930, + "000": 931, + "_C": 932, + "]Ċ": 933, + "Ġqu": 934, + "ĠString": 935, + "ca": 936, + "SE": 937, + "Ġro": 938, + "sh": 939, + "ual": 940, + "Type": 941, + "son": 942, + "new": 943, + "ern": 944, + "Ġag": 945, + "AR": 946, + "];Ċ": 947, + "].": 948, + "Ġ?": 949, + "ical": 950, + "Ġdes": 951, + "uth": 952, + "ix": 953, + "ays": 954, + "Ġtype": 955, + "'t": 956, + "ault": 957, + "Ġinter": 958, + "var": 959, + ".b": 960, + "Ġpart": 961, + ".d": 962, + "urrent": 963, + "IT": 964, + "EN": 965, + "30": 966, + "enc": 967, + "(f": 968, + "ra": 969, + "value": 970, + "cho": 971, + "18": 972, + "utton": 973, + "ose": 974, + "14": 975, + "Ġ!=": 976, + "ater": 977, + "é": 978, + "reate": 979, + "oll": 980, + "pos": 981, + "yle": 982, + "ng": 983, + "AL": 984, + "using": 985, + "ames": 986, + "Ġ{čĊ": 987, + "ates": 988, + "ely": 989, + "Ġwork": 990, + "Ġem": 991, + "inal": 992, + "Ġsp": 993, + "Ġwhen": 994, + ".set": 995, + "ĠĠĠĠĠĠ": 996, + "):Ċ": 997, + "to": 998, + "quire": 999, + "indow": 1000, + "lement": 1001, + "pect": 1002, + "ash": 1003, + "[i": 1004, + "Ġuse": 1005, + ".F": 1006, + "pec": 1007, + "Ġad": 1008, + "ove": 1009, + "ception": 1010, + "ength": 1011, + "include": 1012, + "ader": 1013, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 1014, + "atus": 1015, + "Th": 1016, + "itle": 1017, + "rit": 1018, + "void": 1019, + "().": 1020, + "(Ċ": 1021, + "Ġoff": 1022, + "Ġother": 1023, + "Ġ&&": 1024, + "';Ċ": 1025, + "ms": 1026, + "Ġbeen": 1027, + "Ġte": 1028, + "ml": 1029, + "co": 1030, + "nc": 1031, + "13": 1032, + "ervice": 1033, + "Ġ%": 1034, + "**Ċ": 1035, + "ann": 1036, + "ade": 1037, + "ĊĊĊĊ": 1038, + "lock": 1039, + "const": 1040, + "100": 1041, + "ponse": 1042, + "Ġsup": 1043, + "++": 1044, + "date": 1045, + "Ġacc": 1046, + "Ġhad": 1047, + "Ġbu": 1048, + "200": 1049, + "ĠRe": 1050, + "Ġwere": 1051, + "Ġfile": 1052, + "Ġwould": 1053, + "ĠâĢľ": 1054, + "ven": 1055, + "iss": 1056, + "Ġour": 1057, + "class": 1058, + "raw": 1059, + "Ġyear": 1060, + "Data": 1061, + "Ġval": 1062, + "Ġsome": 1063, + "fter": 1064, + "ys": 1065, + "Ġ///": 1066, + "round": 1067, + "view": 1068, + "Ġpe": 1069, + "Ġthere": 1070, + "Ġsaid": 1071, + "du": 1072, + "of": 1073, + "line": 1074, + "/*": 1075, + "duct": 1076, + "Ġher": 1077, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠ": 1078, + "Res": 1079, + "Ġco": 1080, + "Ġcomm": 1081, + "ise": 1082, + "min": 1083, + "ĠĠĠĠĊ": 1084, + "#include": 1085, + "ethod": 1086, + ".P": 1087, + "ute": 1088, + "Ġass": 1089, + "Int": 1090, + "ask": 1091, + "loc": 1092, + "Ġlike": 1093, + "ody": 1094, + "Ġlet": 1095, + "load": 1096, + "Ġam": 1097, + "rol": 1098, + "Ġgr": 1099, + "yp": 1100, + "Ġalso": 1101, + "ĠIt": 1102, + "url": 1103, + "ific": 1104, + "ors": 1105, + "_P": 1106, + "_n": 1107, + "igh": 1108, + "Ġthan": 1109, + "Com": 1110, + "AN": 1111, + "UL": 1112, + "ating": 1113, + "17": 1114, + "ĠThis": 1115, + "ref": 1116, + "_S": 1117, + "Ġstatic": 1118, + "roll": 1119, + "Ġjust": 1120, + "Ġresult": 1121, + "ian": 1122, + "idth": 1123, + "Ġthem": 1124, + "));Ċ": 1125, + "der": 1126, + "reak": 1127, + "Con": 1128, + "://": 1129, + "ule": 1130, + "...": 1131, + "arch": 1132, + "ement": 1133, + "Ġ<<": 1134, + "50": 1135, + "ush": 1136, + "ense": 1137, + "arr": 1138, + "Ġinto": 1139, + "cess": 1140, + "amp": 1141, + "ied": 1142, + "ument": 1143, + "Ġ\\": 1144, + "],": 1145, + "wo": 1146, + "als": 1147, + "Ġwhat": 1148, + "anc": 1149, + "Value": 1150, + "='": 1151, + "olum": 1152, + "Ġpos": 1153, + "ages": 1154, + "ayer": 1155, + "Ġsc": 1156, + "ues": 1157, + "\")Ċ": 1158, + "_T": 1159, + "Ġlist": 1160, + "(s": 1161, + "Ġcase": 1162, + "Ch": 1163, + "ĉĉĉĉĉ": 1164, + "////////": 1165, + "ponent": 1166, + "Ġz": 1167, + "Ġkn": 1168, + "let": 1169, + "DE": 1170, + "red": 1171, + "Ġfe": 1172, + "Ġ},Ċ": 1173, + "Ġ,": 1174, + "(t": 1175, + "Ġfirst": 1176, + "');Ċ": 1177, + "word": 1178, + "Ġimport": 1179, + "Ġact": 1180, + "Ġchar": 1181, + "CT": 1182, + "ĠTr": 1183, + "ople": 1184, + "={": 1185, + "ĉf": 1186, + "24": 1187, + "ient": 1188, + "cent": 1189, + ".j": 1190, + "lection": 1191, + "))Ċ": 1192, + "Ġonly": 1193, + "Ġprint": 1194, + "mer": 1195, + ".W": 1196, + "ock": 1197, + "Ġ--": 1198, + "Text": 1199, + "Ġop": 1200, + "ank": 1201, + "Ġits": 1202, + "Ġback": 1203, + "[\"": 1204, + "Ġneed": 1205, + "Ġcl": 1206, + "Ġsub": 1207, + "Ġla": 1208, + "((": 1209, + ".\"": 1210, + "Object": 1211, + "Ġstart": 1212, + "file": 1213, + "(self": 1214, + "ner": 1215, + "ey": 1216, + "Ġuser": 1217, + "Ġent": 1218, + "ĠCom": 1219, + "its": 1220, + "ĠCon": 1221, + "ouble": 1222, + "ower": 1223, + "item": 1224, + "very": 1225, + "ĠWe": 1226, + "64": 1227, + "lick": 1228, + "ĠQ": 1229, + "php": 1230, + "ttp": 1231, + "':": 1232, + "ics": 1233, + "Ġunder": 1234, + "Ġ*Ċ": 1235, + ".L": 1236, + ");": 1237, + "ices": 1238, + "Ġreg": 1239, + ")čĊ": 1240, + "ĉpublic": 1241, + "SS": 1242, + "Ġthen": 1243, + "reat": 1244, + "ious": 1245, + ".G": 1246, + "ek": 1247, + "irect": 1248, + "heck": 1249, + "cript": 1250, + "ning": 1251, + "ĠUn": 1252, + "Ġmay": 1253, + "ĠWh": 1254, + "Bo": 1255, + "Item": 1256, + "struct": 1257, + ".st": 1258, + "ream": 1259, + "ible": 1260, + "loat": 1261, + "Ġorg": 1262, + "und": 1263, + "sum": 1264, + "_in": 1265, + "../": 1266, + "_M": 1267, + "Ġhow": 1268, + "rite": 1269, + "'Ċ": 1270, + "To": 1271, + "40": 1272, + "ww": 1273, + "Ġpeople": 1274, + "index": 1275, + ".n": 1276, + "http": 1277, + "(m": 1278, + "ector": 1279, + "Ġind": 1280, + "Ġjav": 1281, + "],Ċ": 1282, + "ĠHe": 1283, + "_st": 1284, + "ful": 1285, + "ole": 1286, + "){Ċ": 1287, + "Ġshould": 1288, + "opy": 1289, + "elp": 1290, + "ier": 1291, + "_name": 1292, + "erson": 1293, + "ION": 1294, + "ote": 1295, + "Ġtest": 1296, + "Ġbet": 1297, + "rror": 1298, + "ular": 1299, + "ãĢ": 1300, + "ĠÐ": 1301, + "bs": 1302, + "ting": 1303, + "Ġmake": 1304, + "Tr": 1305, + "Ġafter": 1306, + "arget": 1307, + "RO": 1308, + "olumn": 1309, + "rc": 1310, + "_re": 1311, + "define": 1312, + "22": 1313, + "Ġright": 1314, + "right": 1315, + "day": 1316, + "Ġlong": 1317, + "[]": 1318, + "(p": 1319, + "td": 1320, + "cond": 1321, + "ĠPro": 1322, + "Ġrem": 1323, + "ptions": 1324, + "vid": 1325, + ".g": 1326, + "Ġext": 1327, + "Ġ__": 1328, + "')Ċ": 1329, + "pace": 1330, + "mp": 1331, + "Ġmin": 1332, + "stance": 1333, + "air": 1334, + "action": 1335, + "wh": 1336, + "type": 1337, + "util": 1338, + "ait": 1339, + "": 1340, + "IC": 1341, + "text": 1342, + "Ġph": 1343, + "Ġfl": 1344, + ".M": 1345, + "ccess": 1346, + "br": 1347, + "fore": 1348, + "ersion": 1349, + "),Ċ": 1350, + ".re": 1351, + "ateg": 1352, + "Ġloc": 1353, + "ins": 1354, + "-s": 1355, + "trib": 1356, + "ĠInt": 1357, + "Ġarray": 1358, + ",\"": 1359, + "Pro": 1360, + "(c": 1361, + "ession": 1362, + ">ĊĊ": 1363, + "Ġshe": 1364, + "\"]": 1365, + "aph": 1366, + "Ġexp": 1367, + "erty": 1368, + "ĠSe": 1369, + "Ġpar": 1370, + "unc": 1371, + "ET": 1372, + "Ġread": 1373, + "print": 1374, + "Ġrel": 1375, + "Ġform": 1376, + "Ġdr": 1377, + "Exception": 1378, + "input": 1379, + "Ġtrans": 1380, + "########": 1381, + "order": 1382, + "By": 1383, + "Ġaw": 1384, + "ities": 1385, + "uff": 1386, + "play": 1387, + ".add": 1388, + "ĠâĢĵ": 1389, + "Ġwant": 1390, + "Ġcomp": 1391, + "ments": 1392, + "Ġ||": 1393, + "az": 1394, + "be": 1395, + "Ġnumber": 1396, + "Ġrequire": 1397, + "ĠEx": 1398, + "60": 1399, + "Ġcol": 1400, + "Ġkey": 1401, + "ember": 1402, + "Ġtwo": 1403, + "Ġsize": 1404, + "Ġwhere": 1405, + "UT": 1406, + "result": 1407, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 1408, + "ough": 1409, + "orld": 1410, + "ood": 1411, + "uch": 1412, + "ative": 1413, + "ger": 1414, + "arent": 1415, + "Ġ/*": 1416, + "Ġarg": 1417, + "Ġwhile": 1418, + "23": 1419, + "(this": 1420, + "Ġrec": 1421, + "Ġdif": 1422, + "State": 1423, + "Ġspec": 1424, + "ride": 1425, + "_F": 1426, + "Ġlook": 1427, + "AM": 1428, + "ility": 1429, + "eter": 1430, + "âĢĻt": 1431, + "ĊĊĊ": 1432, + "ayout": 1433, + "--------------------------------": 1434, + "ager": 1435, + "Ġcould": 1436, + "Ġbr": 1437, + "ends": 1438, + "ures": 1439, + "Ġknow": 1440, + "ets": 1441, + "ĠIf": 1442, + "ĠSh": 1443, + ".w": 1444, + "back": 1445, + "Ġser": 1446, + "Ġ+=": 1447, + "Ġfr": 1448, + "());Ċ": 1449, + "Ġhand": 1450, + "Ind": 1451, + "ULL": 1452, + "Im": 1453, + "();ĊĊ": 1454, + "Ġmost": 1455, + "Ġtry": 1456, + "Ġnow": 1457, + "rough": 1458, + ">čĊ": 1459, + "ackage": 1460, + "Ġhim": 1461, + "._": 1462, + "ify": 1463, + "Ġbreak": 1464, + "Ġ);Ċ": 1465, + "ren": 1466, + "#define": 1467, + "itt": 1468, + "Ġap": 1469, + "ĉc": 1470, + "(n": 1471, + "ĠYou": 1472, + ":ĊĊ": 1473, + "-m": 1474, + "Ġevery": 1475, + "ustom": 1476, + "lient": 1477, + "ocument": 1478, + "cription": 1479, + "Error": 1480, + "-b": 1481, + "о": 1482, + "][": 1483, + "99": 1484, + "trans": 1485, + "Ġpoint": 1486, + "Ġstd": 1487, + "Ġfil": 1488, + "Time": 1489, + "80": 1490, + "Ġmod": 1491, + "Ġ->": 1492, + "Ġerror": 1493, + "ah": 1494, + "Ġtext": 1495, + "roller": 1496, + "lose": 1497, + "ql": 1498, + "Ġpol": 1499, + ">": 1500, + "Ġshow": 1501, + "User": 1502, + "ased": 1503, + "Ġ{ĊĊ": 1504, + "Ġfind": 1505, + "а": 1506, + "ED": 1507, + "span": 1508, + "enu": 1509, + "Ġcurrent": 1510, + "Ġused": 1511, + "cept": 1512, + "clud": 1513, + "Ġplay": 1514, + "Ġlog": 1515, + "ution": 1516, + "fl": 1517, + "Ġsee": 1518, + "indows": 1519, + "Ġhelp": 1520, + "Ġthese": 1521, + "Ġpass": 1522, + "Ġdown": 1523, + "Ġeven": 1524, + "ason": 1525, + "uild": 1526, + "from": 1527, + "(d": 1528, + "Ġbl": 1529, + "label": 1530, + "else": 1531, + "е": 1532, + "Ġ(!": 1533, + "ized": 1534, + "(),": 1535, + "Ġob": 1536, + "Ġitem": 1537, + "ump": 1538, + "UR": 1539, + "orn": 1540, + "Ġdon": 1541, + "Se": 1542, + "man": 1543, + "27": 1544, + "ample": 1545, + "tn": 1546, + "================": 1547, + "He": 1548, + "gram": 1549, + "Ġdid": 1550, + "wn": 1551, + "_h": 1552, + "iver": 1553, + "Ġsm": 1554, + "Ġthrough": 1555, + "ĠAn": 1556, + "che": 1557, + "Ġinv": 1558, + "ouse": 1559, + "Ġes": 1560, + "ĠNew": 1561, + "export": 1562, + "mary": 1563, + "uto": 1564, + "ler": 1565, + "Ġlast": 1566, + "Ġevent": 1567, + "try": 1568, + "ï¼": 1569, + "ily": 1570, + "igned": 1571, + "ines": 1572, + "ollow": 1573, + "icense": 1574, + "sole": 1575, + "lear": 1576, + "(int": 1577, + "Ġagain": 1578, + "Ġhigh": 1579, + "html": 1580, + "Index": 1581, + "uthor": 1582, + "Ġ/**Ċ": 1583, + "Ġline": 1584, + "Event": 1585, + "_D": 1586, + "Ġdoes": 1587, + "itial": 1588, + "Ġcr": 1589, + "ars": 1590, + "28": 1591, + "Ġtem": 1592, + "cause": 1593, + "face": 1594, + "Ġ`": 1595, + "_A": 1596, + "Button": 1597, + "ature": 1598, + "ected": 1599, + "ES": 1600, + "ister": 1601, + "ĉĊ": 1602, + "Ġbefore": 1603, + "ale": 1604, + "other": 1605, + "Ġbecause": 1606, + "roid": 1607, + "Ġed": 1608, + "ik": 1609, + "reg": 1610, + "ĠDe": 1611, + "Ġdist": 1612, + "},Ċ": 1613, + "Ġstate": 1614, + "Ġcons": 1615, + "rint": 1616, + "att": 1617, + "Ġhere": 1618, + "ined": 1619, + "Ġfinal": 1620, + "Ġ\"\"": 1621, + "Key": 1622, + "LO": 1623, + "Ġdel": 1624, + "pty": 1625, + "thing": 1626, + "26": 1627, + "ĠAnd": 1628, + "Ġrun": 1629, + "ĠX": 1630, + "ym": 1631, + ".app": 1632, + "Ġvery": 1633, + "ces": 1634, + "_N": 1635, + "ared": 1636, + "ward": 1637, + "list": 1638, + "ited": 1639, + "olog": 1640, + "itch": 1641, + "Box": 1642, + "ife": 1643, + "33": 1644, + "Ġac": 1645, + "Ġmodel": 1646, + "Ġmon": 1647, + "Ġway": 1648, + "lete": 1649, + "Ġcall": 1650, + "Ġatt": 1651, + "Ġcal": 1652, + "vert": 1653, + "Ġdec": 1654, + "lease": 1655, + "oun": 1656, + "Ġ});Ċ": 1657, + "fr": 1658, + "formation": 1659, + "etail": 1660, + "Ġnum": 1661, + "aj": 1662, + "query": 1663, + "Ġwell": 1664, + "Ġobject": 1665, + "ĠAs": 1666, + "Ġyears": 1667, + "Color": 1668, + "IS": 1669, + "Ġdefault": 1670, + "Wh": 1671, + "Ġins": 1672, + "aint": 1673, + "Ġjava": 1674, + "Ġsim": 1675, + "ĠAr": 1676, + "mon": 1677, + "til": 1678, + "();čĊ": 1679, + "):": 1680, + "Set": 1681, + "29": 1682, + "atter": 1683, + "Ġview": 1684, + "Ġpres": 1685, + "array": 1686, + "We": 1687, + "At": 1688, + "Ġbel": 1689, + "Ġmany": 1690, + "21": 1691, + "Man": 1692, + "ender": 1693, + "Ġbeing": 1694, + "Ġgood": 1695, + "ĉĉĉĉĉĉ": 1696, + "ational": 1697, + "ware": 1698, + ".log": 1699, + "{čĊ": 1700, + "Ġusing": 1701, + "_B": 1702, + "Ġ:=": 1703, + "_w": 1704, + "ists": 1705, + "lish": 1706, + "Ġstud": 1707, + "ĠAl": 1708, + "Ġgu": 1709, + "config": 1710, + "uring": 1711, + "time": 1712, + "oken": 1713, + "amespace": 1714, + "Ġrequest": 1715, + "Ġchild": 1716, + "ĠÃ": 1717, + "lob": 1718, + "Ġparam": 1719, + "Ġ}čĊ": 1720, + "01": 1721, + "Ġecho": 1722, + "function": 1723, + "********************************": 1724, + "ps": 1725, + "Element": 1726, + "alk": 1727, + "lication": 1728, + "by": 1729, + "Size": 1730, + "rawing": 1731, + "Ġperson": 1732, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 1733, + "\\n": 1734, + "object": 1735, + "ince": 1736, + "En": 1737, + "File": 1738, + "uf": 1739, + "ffect": 1740, + "AC": 1741, + "Ġstyle": 1742, + "summary": 1743, + "Ġque": 1744, + "_r": 1745, + "Ġ($": 1746, + "Model": 1747, + "ident": 1748, + "Ġmethod": 1749, + "IL": 1750, + "ott": 1751, + "less": 1752, + "ING": 1753, + "Ġ()": 1754, + "Ġexpect": 1755, + "ync": 1756, + "package": 1757, + "35": 1758, + "urs": 1759, + "Ġprot": 1760, + "./": 1761, + "pre": 1762, + "Ġ)Ċ": 1763, + "ma": 1764, + "Ġsur": 1765, + "Ġfound": 1766, + "Info": 1767, + "par": 1768, + "imes": 1769, + ".e": 1770, + "ains": 1771, + "Ġpost": 1772, + "-d": 1773, + "45": 1774, + "olean": 1775, + "Ġsl": 1776, + "PE": 1777, + "Ġsuch": 1778, + "select": 1779, + "ainer": 1780, + "Ġthink": 1781, + "Ġdiffer": 1782, + ".r": 1783, + "/**Ċ": 1784, + "FF": 1785, + "ool": 1786, + "plate": 1787, + "qual": 1788, + "ĠFor": 1789, + "Ġmuch": 1790, + "uc": 1791, + "(new": 1792, + "odule": 1793, + "Ġsom": 1794, + "Ġhttp": 1795, + "ĠList": 1796, + "Ġcount": 1797, + "Ġinst": 1798, + "char": 1799, + "mit": 1800, + ".id": 1801, + "aking": 1802, + "Ġgener": 1803, + "px": 1804, + "vice": 1805, + "37": 1806, + "_data": 1807, + "ĠNULL": 1808, + "}čĊ": 1809, + "idd": 1810, + "ãĢĤ": 1811, + "Ġmed": 1812, + "org": 1813, + "ider": 1814, + "ache": 1815, + "work": 1816, + "Ġcheck": 1817, + "ween": 1818, + "Ġ((": 1819, + "the": 1820, + "ants": 1821, + "><": 1822, + ".B": 1823, + "-c": 1824, + "Ġopen": 1825, + "Ġest": 1826, + "ĠĠĠĠĠĠĠĠĊ": 1827, + "Ġnext": 1828, + "IM": 1829, + "ÑĤ": 1830, + "OT": 1831, + "ó": 1832, + "Ġfollow": 1833, + "content": 1834, + "ĠĠĠĠĠĠĠĠĠĠĠĠ": 1835, + "Ġinclud": 1836, + "HE": 1837, + "ĠRes": 1838, + "Ġhref": 1839, + "и": 1840, + "Ġcar": 1841, + "ypes": 1842, + "image": 1843, + "Un": 1844, + "Ġbool": 1845, + "AD": 1846, + "Ġgame": 1847, + ".Form": 1848, + "rows": 1849, + "*/": 1850, + "velop": 1851, + ".Drawing": 1852, + "Ġpath": 1853, + "ision": 1854, + "Ġeach": 1855, + "ĠPl": 1856, + "_type": 1857, + "Path": 1858, + "nection": 1859, + "Ġav": 1860, + "').": 1861, + "Ġsupport": 1862, + "ENT": 1863, + "rem": 1864, + "\").": 1865, + "Ġown": 1866, + "Ġcor": 1867, + "count": 1868, + "miss": 1869, + "ually": 1870, + "Ġmem": 1871, + "std": 1872, + "ience": 1873, + "search": 1874, + "\"ĊĊ": 1875, + "Form": 1876, + "Ġsex": 1877, + "ename": 1878, + "Ġsign": 1879, + "Ġet": 1880, + "ĠĠĠĠĠĠĠĠĠĠ": 1881, + "','": 1882, + "ĠApp": 1883, + "Ġthose": 1884, + "off": 1885, + "Ġerr": 1886, + "Ġsystem": 1887, + "Ġbest": 1888, + "code": 1889, + "Ġsame": 1890, + "Ġdi": 1891, + "uss": 1892, + "Ġcreate": 1893, + "ather": 1894, + "Array": 1895, + ".in": 1896, + "fe": 1897, + "Service": 1898, + "UN": 1899, + "ats": 1900, + "ĠZ": 1901, + "alth": 1902, + "Ġmade": 1903, + "true": 1904, + "AB": 1905, + "Ġmark": 1906, + "rid": 1907, + "ified": 1908, + ",čĊ": 1909, + "yn": 1910, + "press": 1911, + "Ġgroup": 1912, + "Ġfin": 1913, + "ĠLicense": 1914, + "Field": 1915, + "eger": 1916, + "Ġworld": 1917, + "iness": 1918, + "ty": 1919, + "Ġprocess": 1920, + "(b": 1921, + "Ġcre": 1922, + "arn": 1923, + "ives": 1924, + "Ġmain": 1925, + "ideo": 1926, + "36": 1927, + "_g": 1928, + "AG": 1929, + "valid": 1930, + "img": 1931, + "PI": 1932, + "Ġcolor": 1933, + "Ġreport": 1934, + "Ġtake": 1935, + "rib": 1936, + "OM": 1937, + "Ġday": 1938, + "Request": 1939, + "Ġsk": 1940, + "bers": 1941, + "ĉs": 1942, + ".Add": 1943, + "oot": 1944, + "Image": 1945, + "Ġcomple": 1946, + "ollection": 1947, + "Ġtop": 1948, + "Ġfree": 1949, + "AS": 1950, + "De": 1951, + "ĠOn": 1952, + "IG": 1953, + "90": 1954, + "eta": 1955, + "Date": 1956, + "Ġaction": 1957, + "34": 1958, + "Over": 1959, + "itor": 1960, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 1961, + "not": 1962, + "Ġindex": 1963, + "her": 1964, + "icon": 1965, + "On": 1966, + ";čĊčĊ": 1967, + "ivity": 1968, + "mand": 1969, + ".Windows": 1970, + "OL": 1971, + "Ġreal": 1972, + "Ġmax": 1973, + "land": 1974, + "....": 1975, + "raph": 1976, + "Ġbuild": 1977, + "leg": 1978, + "assword": 1979, + "?ĊĊ": 1980, + "âĢ¦": 1981, + "ook": 1982, + "uck": 1983, + "Ġmessage": 1984, + "test": 1985, + "ivers": 1986, + "38": 1987, + "Ġinput": 1988, + "Ġart": 1989, + "Ġbetween": 1990, + "Get": 1991, + "enter": 1992, + "ground": 1993, + "ene": 1994, + "á": 1995, + ".length": 1996, + "Node": 1997, + "(i": 1998, + "Class": 1999, + "for": 2000, + "ĠâĢĶ": 2001, + "ten": 2002, + "oin": 2003, + "Ġke": 2004, + "ui": 2005, + "ĠIN": 2006, + "Ġtable": 2007, + "sub": 2008, + "ĠLe": 2009, + "Ġhead": 2010, + "Ġmust": 2011, + "////////////////": 2012, + ".util": 2013, + "Context": 2014, + "Ġorder": 2015, + "Ġmov": 2016, + "over": 2017, + "Ġcontin": 2018, + "Ġsay": 2019, + "static": 2020, + ".Text": 2021, + "ĠclassName": 2022, + "pany": 2023, + "Ġter": 2024, + "head": 2025, + "rg": 2026, + "Ġproduct": 2027, + "This": 2028, + ".âĢĿ": 2029, + "ĠBut": 2030, + "70": 2031, + "loy": 2032, + "Ġdouble": 2033, + "sg": 2034, + "Ġplace": 2035, + ".x": 2036, + "message": 2037, + "Ġinformation": 2038, + "private": 2039, + "Ġoper": 2040, + "ced": 2041, + "db": 2042, + "\">": 2043, + "Param": 2044, + "icle": 2045, + "Ġweek": 2046, + "Ġprop": 2047, + "table": 2048, + "idget": 2049, + "place": 2050, + "Prop": 2051, + "ĠAll": 2052, + "els": 2053, + "box": 2054, + ".ĊĊĊĊ": 2055, + ".R": 2056, + "ĠTo": 2057, + "iter": 2058, + "Sh": 2059, + "uration": 2060, + "older": 2061, + "_list": 2062, + "come": 2063, + "Ġsw": 2064, + "ization": 2065, + "ĉfor": 2066, + "bl": 2067, + "Ġprogram": 2068, + "(e": 2069, + "ape": 2070, + "check": 2071, + ".Forms": 2072, + "Ġund": 2073, + "ategory": 2074, + "75": 2075, + "ags": 2076, + "Ġresponse": 2077, + "US": 2078, + "request": 2079, + "Ġstruct": 2080, + "escription": 2081, + "Ġcode": 2082, + "_H": 2083, + "uffer": 2084, + "Ġwithout": 2085, + "lobal": 2086, + "Manager": 2087, + "ilter": 2088, + "PO": 2089, + "ĉthis": 2090, + "option": 2091, + "Ġsol": 2092, + "Ġ===": 2093, + "akes": 2094, + "Controller": 2095, + "44": 2096, + "Message": 2097, + "Ġref": 2098, + "ever": 2099, + "ĠSo": 2100, + "aining": 2101, + ".append": 2102, + "Ġstill": 2103, + "Ġprovid": 2104, + "Ġassert": 2105, + "med": 2106, + "Ġcap": 2107, + "usiness": 2108, + "Ġrep": 2109, + "tings": 2110, + "ved": 2111, + ".N": 2112, + "api": 2113, + "OD": 2114, + "Ġfield": 2115, + "iven": 2116, + "oto": 2117, + "âĢľ": 2118, + "col": 2119, + "(x": 2120, + "ght": 2121, + "Result": 2122, + "Code": 2123, + ".is": 2124, + "link": 2125, + "Ġcour": 2126, + "An": 2127, + "Ġteam": 2128, + "ĉint": 2129, + "ift": 2130, + "55": 2131, + "Ġsecond": 2132, + "Ġgoing": 2133, + "Ġrange": 2134, + "_E": 2135, + "ness": 2136, + "39": 2137, + "Ġfam": 2138, + "Ġnil": 2139, + "ĠCont": 2140, + "ailable": 2141, + "utes": 2142, + "atab": 2143, + "Ġfact": 2144, + "Ġvis": 2145, + "(&": 2146, + "ĠAN": 2147, + "31": 2148, + "Al": 2149, + "title": 2150, + "Ġandroid": 2151, + "CE": 2152, + "\\\"": 2153, + "irt": 2154, + "Ġwrit": 2155, + "н": 2156, + "ĉm": 2157, + "ftware": 2158, + "ond": 2159, + "Ġret": 2160, + "osition": 2161, + "Ġhome": 2162, + "Ġleft": 2163, + "args": 2164, + "meric": 2165, + "48": 2166, + "Ġdirect": 2167, + "oci": 2168, + "Pl": 2169, + "As": 2170, + "ret": 2171, + "ado": 2172, + "Of": 2173, + "chn": 2174, + "ĠGet": 2175, + "ee": 2176, + "ross": 2177, + "();": 2178, + "____": 2179, + ".ph": 2180, + "It": 2181, + "oute": 2182, + "Ġexper": 2183, + "chool": 2184, + "www": 2185, + "},": 2186, + "Ġallow": 2187, + "ĠÂ": 2188, + "())": 2189, + "size": 2190, + "ism": 2191, + "ai": 2192, + "tract": 2193, + "ane": 2194, + "...ĊĊ": 2195, + "context": 2196, + "Ġbeg": 2197, + "CH": 2198, + "Ġpage": 2199, + "hip": 2200, + "no": 2201, + "core": 2202, + "sp": 2203, + "Ġdifferent": 2204, + "iable": 2205, + "ĠMe": 2206, + "_IN": 2207, + "button": 2208, + "ĠIs": 2209, + "ervices": 2210, + "Ġca": 2211, + "Ġaround": 2212, + "App": 2213, + "ration": 2214, + "Ġrece": 2215, + "Ġreally": 2216, + "Ġimage": 2217, + "Ġtarget": 2218, + "Ġdep": 2219, + "opyright": 2220, + "tra": 2221, + "ingle": 2222, + "ital": 2223, + "Layout": 2224, + "Ġboth": 2225, + "Override": 2226, + "arm": 2227, + "=>": 2228, + "aterial": 2229, + "iled": 2230, + "Ġput": 2231, + "Qu": 2232, + "ÑĢ": 2233, + "ung": 2234, + "map": 2235, + "ĉĉĉĉĉĉĉĉ": 2236, + "Ġlevel": 2237, + "Component": 2238, + "book": 2239, + "creen": 2240, + "_RE": 2241, + "Ġconfig": 2242, + "ãģ": 2243, + "Or": 2244, + ".data": 2245, + "Ġdocument": 2246, + "\",\"": 2247, + "tribute": 2248, + "ux": 2249, + "Log": 2250, + "ference": 2251, + "post": 2252, + "_e": 2253, + "Ġlocal": 2254, + "andom": 2255, + "assert": 2256, + "Val": 2257, + "lected": 2258, + "ina": 2259, + "atabase": 2260, + "Add": 2261, + "Ġcontent": 2262, + ".print": 2263, + "signed": 2264, + "ric": 2265, + ".\"ĊĊ": 2266, + "Ġfa": 2267, + "!ĊĊ": 2268, + "-f": 2269, + "ived": 2270, + "Ġquest": 2271, + ".ex": 2272, + "Ġfloat": 2273, + "Ġdevelop": 2274, + "оÐ": 2275, + "Map": 2276, + "ading": 2277, + "Ġposs": 2278, + "UE": 2279, + "namespace": 2280, + "_O": 2281, + "ĉb": 2282, + ".Get": 2283, + ">(": 2284, + "json": 2285, + "etails": 2286, + "66": 2287, + "Ġtoo": 2288, + "Ġextends": 2289, + "ĠNone": 2290, + "Ġfore": 2291, + "(String": 2292, + "format": 2293, + "Ġgreat": 2294, + "inter": 2295, + "cale": 2296, + "Ñģ": 2297, + "ron": 2298, + "iving": 2299, + "Ent": 2300, + "ency": 2301, + "xt": 2302, + "oy": 2303, + "05": 2304, + "Ġmonth": 2305, + "Ġhapp": 2306, + "Ġsuper": 2307, + "bar": 2308, + "default": 2309, + "_de": 2310, + "ords": 2311, + "ln": 2312, + "({Ċ": 2313, + "ĠInd": 2314, + "ases": 2315, + "Ġtitle": 2316, + "Ġcontext": 2317, + "08": 2318, + "oh": 2319, + "-p": 2320, + "Em": 2321, + "Ġmet": 2322, + "Test": 2323, + "Ġlife": 2324, + "_v": 2325, + "ĠUS": 2326, + "UI": 2327, + "ocation": 2328, + "md": 2329, + "Ġ[Ċ": 2330, + "Ġ]": 2331, + "sw": 2332, + "Ġincre": 2333, + "script": 2334, + "ential": 2335, + "ways": 2336, + ".de": 2337, + "Ġsrc": 2338, + "Ġcatch": 2339, + "ĠAmeric": 2340, + "//Ċ": 2341, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 2342, + "Ġpay": 2343, + "plit": 2344, + "âĢĶ": 2345, + "Ġcoun": 2346, + "obj": 2347, + ".php": 2348, + "Ġchange": 2349, + "ething": 2350, + "'re": 2351, + "aster": 2352, + "los": 2353, + "lation": 2354, + "ĠĠĊ": 2355, + "Le": 2356, + "ä": 2357, + "({": 2358, + "ready": 2359, + "ĠNo": 2360, + "Ġposition": 2361, + "Ġold": 2362, + "Ġbook": 2363, + "abled": 2364, + "bug": 2365, + "202": 2366, + "Hand": 2367, + "};ĊĊ": 2368, + "isplay": 2369, + "aving": 2370, + "04": 2371, + "Ġgover": 2372, + "Ġversion": 2373, + "System": 2374, + "nect": 2375, + "response": 2376, + "Style": 2377, + "Up": 2378, + "angu": 2379, + "Ġthree": 2380, + "init": 2381, + "ero": 2382, + "Ġlaw": 2383, + "endif": 2384, + "Ġbase": 2385, + "email": 2386, + "(l": 2387, + "_V": 2388, + "Ġconf": 2389, + "ATE": 2390, + "Ġduring": 2391, + "tes": 2392, + "Ġconsole": 2393, + "ĠPr": 2394, + "Ġspe": 2395, + "ves": 2396, + "65": 2397, + "path": 2398, + "ialog": 2399, + "dition": 2400, + "_to": 2401, + "ards": 2402, + "Ġagainst": 2403, + "etwork": 2404, + "ĠPh": 2405, + "_L": 2406, + "cur": 2407, + "imit": 2408, + "With": 2409, + "Ġpower": 2410, + "ium": 2411, + "';ĊĊ": 2412, + "Ġwom": 2413, + "left": 2414, + "ources": 2415, + "atri": 2416, + "ĠIm": 2417, + "ĠMan": 2418, + "orth": 2419, + "${": 2420, + "88": 2421, + "quals": 2422, + "ese": 2423, + "_size": 2424, + "Ġiss": 2425, + "otal": 2426, + "-g": 2427, + "ique": 2428, + "rame": 2429, + "Ġwidth": 2430, + "erg": 2431, + ")(": 2432, + "ittle": 2433, + "TR": 2434, + "ĠThey": 2435, + "ences": 2436, + "02": 2437, + "rl": 2438, + "ons": 2439, + "Ġlabel": 2440, + ".y": 2441, + "-t": 2442, + "update": 2443, + "anel": 2444, + "sc": 2445, + ".to": 2446, + "Ġproject": 2447, + "ü": 2448, + "Ġelement": 2449, + "Ġsuccess": 2450, + "ĉĉĊ": 2451, + ".sh": 2452, + "ram": 2453, + "ched": 2454, + "())Ċ": 2455, + "Ġ(Ċ": 2456, + "Ġdate": 2457, + "Ġtot": 2458, + "_ST": 2459, + "All": 2460, + "ification": 2461, + "ĉvar": 2462, + "Ġtri": 2463, + "chem": 2464, + "my": 2465, + "Ġbig": 2466, + "ĠAd": 2467, + "ĠAt": 2468, + "ots": 2469, + "num": 2470, + "Act": 2471, + "Ġmap": 2472, + "era": 2473, + "cope": 2474, + ".$": 2475, + ",âĢĿ": 2476, + "Ġpop": 2477, + "Ġfew": 2478, + "Ġlen": 2479, + "uid": 2480, + "eters": 2481, + "ules": 2482, + "ÃŃ": 2483, + "source": 2484, + "https": 2485, + "Ġdem": 2486, + "Ġear": 2487, + "################": 2488, + "Ġmatch": 2489, + "ories": 2490, + "49": 2491, + "aces": 2492, + "ĠCl": 2493, + "Ġnode": 2494, + "78": 2495, + "irc": 2496, + "local": 2497, + "unity": 2498, + "};Ċ": 2499, + "Ġanother": 2500, + "<<": 2501, + "ogle": 2502, + "Ġsit": 2503, + "ework": 2504, + "TE": 2505, + ".I": 2506, + "NS": 2507, + "ology": 2508, + "ought": 2509, + ".Cont": 2510, + ">>": 2511, + "Ġcare": 2512, + "state": 2513, + "ĉprivate": 2514, + "Ġeffect": 2515, + "++)": 2516, + "_file": 2517, + "ending": 2518, + "Line": 2519, + "For": 2520, + "ior": 2521, + "ĠSc": 2522, + "Ġfun": 2523, + ".Size": 2524, + "ĉelse": 2525, + "])": 2526, + "start": 2527, + "vious": 2528, + "Ġ},": 2529, + "ours": 2530, + "Ġleg": 2531, + "Ġservice": 2532, + "Ġsince": 2533, + "iron": 2534, + "Label": 2535, + "Ġnon": 2536, + "Ġlos": 2537, + "iction": 2538, + "Ġfull": 2539, + "acter": 2540, + "board": 2541, + "gress": 2542, + "Ġturn": 2543, + "ither": 2544, + "09": 2545, + ".size": 2546, + "Ġbody": 2547, + "resh": 2548, + "eturn": 2549, + "199": 2550, + "(_": 2551, + "yles": 2552, + "ormal": 2553, + "pi": 2554, + "Ġsomething": 2555, + "!--": 2556, + "uint": 2557, + "Ġprodu": 2558, + "Ġstand": 2559, + "Ġproble": 2560, + "Ġavailable": 2561, + "mt": 2562, + "ĠBl": 2563, + "Ġ...": 2564, + "Ġblock": 2565, + "Input": 2566, + "Ġkeep": 2567, + "Count": 2568, + "open": 2569, + "Ġ['": 2570, + "Ġthrow": 2571, + "uilder": 2572, + "Action": 2573, + "Ġthings": 2574, + "True": 2575, + "Ġurl": 2576, + "ĠBo": 2577, + "printf": 2578, + "Ġred": 2579, + "js": 2580, + ".create": 2581, + "ĠOr": 2582, + "Status": 2583, + "Instance": 2584, + "Ġcontrol": 2585, + "Ġcome": 2586, + "Ġcustom": 2587, + "location": 2588, + "07": 2589, + "model": 2590, + "ĠčĊ": 2591, + "Ġsource": 2592, + "Ġeas": 2593, + ".out": 2594, + "]ĊĊ": 2595, + "oney": 2596, + "Ġawait": 2597, + "Ġpartic": 2598, + "AP": 2599, + "ublish": 2600, + "odes": 2601, + "_pro": 2602, + "ply": 2603, + "riter": 2604, + "Ġprov": 2605, + "Ġmill": 2606, + "HT": 2607, + "])Ċ": 2608, + "Ġchang": 2609, + "Ġask": 2610, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 2611, + "Ġoutput": 2612, + "Ġemail": 2613, + "68": 2614, + ".push": 2615, + "Ġ}čĊčĊ": 2616, + "ination": 2617, + "47": 2618, + "atrix": 2619, + "Table": 2620, + "uccess": 2621, + "]);Ċ": 2622, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 2623, + "Ġdisc": 2624, + "([": 2625, + "Ġbusiness": 2626, + "height": 2627, + ".html": 2628, + "ta": 2629, + "field": 2630, + "Ġrequired": 2631, + "_R": 2632, + "Ġgovern": 2633, + "}čĊčĊ": 2634, + "lex": 2635, + "500": 2636, + ".,": 2637, + "ĠSet": 2638, + "urch": 2639, + "///": 2640, + "ts": 2641, + "af": 2642, + "Ġmight": 2643, + "istory": 2644, + "Str": 2645, + "Ġnever": 2646, + "Response": 2647, + "arse": 2648, + "ada": 2649, + "ĠHow": 2650, + "Ġ*)": 2651, + "Ġ;": 2652, + "Ġhard": 2653, + "Ad": 2654, + "Ġintern": 2655, + "used": 2656, + "(data": 2657, + "mod": 2658, + "annel": 2659, + "Ġnp": 2660, + "ugg": 2661, + "Ġ/>Ċ": 2662, + "Ġcalled": 2663, + "body": 2664, + "Ġcho": 2665, + "(r": 2666, + "_set": 2667, + "ird": 2668, + "Ġ>=": 2669, + "Ġ};Ċ": 2670, + "Ġoptions": 2671, + "ĠGener": 2672, + "Ġheight": 2673, + "Point": 2674, + "You": 2675, + "ety": 2676, + "Click": 2677, + "Ġsmall": 2678, + "Ġide": 2679, + "Ġaccess": 2680, + "anguage": 2681, + "Ġprotected": 2682, + "Ġjob": 2683, + "ĠThere": 2684, + "Def": 2685, + "Ġaddress": 2686, + "Ġuint": 2687, + "Not": 2688, + "oo": 2689, + "aps": 2690, + "
&": 5909, + "CON": 5910, + "Ġrepl": 5911, + "Ġregular": 5912, + "Storage": 5913, + "ramework": 5914, + "Ġgoal": 5915, + "Ġtouch": 5916, + ".widget": 5917, + "Ġbuilt": 5918, + "des": 5919, + "Part": 5920, + "(re": 5921, + "Ġworth": 5922, + "hib": 5923, + "game": 5924, + "91": 5925, + "192": 5926, + "Ġв": 5927, + "acion": 5928, + "ĠWhite": 5929, + "(type": 5930, + "(`": 5931, + "81": 5932, + "Ġnatural": 5933, + "Ġinj": 5934, + "Ġcalcul": 5935, + "ĠApril": 5936, + ".List": 5937, + "Ġassociated": 5938, + "ĉSystem": 5939, + "~~": 5940, + "=[": 5941, + "Ġstorage": 5942, + "Ġbytes": 5943, + "Ġtravel": 5944, + "Ġsou": 5945, + "Ġpassed": 5946, + "!=": 5947, + "ascript": 5948, + ".open": 5949, + "Ġgrid": 5950, + "Ġbus": 5951, + "Ġrecogn": 5952, + "Ab": 5953, + "Ġhon": 5954, + "ĠCenter": 5955, + "Ġprec": 5956, + "build": 5957, + "73": 5958, + "HTML": 5959, + "ĠSan": 5960, + "Ġcountries": 5961, + "aled": 5962, + "token": 5963, + "kt": 5964, + "Ġqual": 5965, + "Last": 5966, + "adow": 5967, + "Ġmanufact": 5968, + "idad": 5969, + "jango": 5970, + "Next": 5971, + "xf": 5972, + ".a": 5973, + "Ġporno": 5974, + "ĠPM": 5975, + "erve": 5976, + "iting": 5977, + "_th": 5978, + "ci": 5979, + "=None": 5980, + "gs": 5981, + "Ġlogin": 5982, + "atives": 5983, + "']);Ċ": 5984, + "Äħ": 5985, + "Ġill": 5986, + "IA": 5987, + "children": 5988, + "DO": 5989, + "Ġlevels": 5990, + "Ġ{{": 5991, + "Ġlooks": 5992, + "Ġ\"#": 5993, + "ToString": 5994, + "Ġnecessary": 5995, + "ĠĠĠĊ": 5996, + "cell": 5997, + "Entry": 5998, + "Ġ'#": 5999, + "Ġextrem": 6000, + "Selector": 6001, + "Ġplaceholder": 6002, + "Load": 6003, + "Ġreleased": 6004, + "ORE": 6005, + "Enumer": 6006, + "ĠTV": 6007, + "SET": 6008, + "inq": 6009, + "Press": 6010, + "ĠDepartment": 6011, + "Ġproperties": 6012, + "Ġrespond": 6013, + "Search": 6014, + "ael": 6015, + "Ġrequ": 6016, + "ĠBook": 6017, + "/Ċ": 6018, + "(st": 6019, + "Ġfinancial": 6020, + "icket": 6021, + "_input": 6022, + "Ġthreat": 6023, + "(in": 6024, + "Strip": 6025, + "ìĿ": 6026, + "ção": 6027, + "71": 6028, + "Ġevidence": 6029, + "));": 6030, + "ĠBro": 6031, + "Ġ[];Ċ": 6032, + "Ġou": 6033, + "buf": 6034, + "Script": 6035, + "dat": 6036, + "Ġrule": 6037, + "#import": 6038, + "=\"/": 6039, + "Serial": 6040, + "Ġstarting": 6041, + "[index": 6042, + "ae": 6043, + "Ġcontrib": 6044, + "session": 6045, + "_new": 6046, + "utable": 6047, + "ober": 6048, + "Ġ\"./": 6049, + "Ġlogger": 6050, + "Ġrecently": 6051, + "Ġreturned": 6052, + "ččĊ": 6053, + ")))Ċ": 6054, + "itions": 6055, + "Ġseek": 6056, + "Ġcommunic": 6057, + "Ġ\".": 6058, + "Ġusername": 6059, + "ECT": 6060, + "DS": 6061, + "Ġotherwise": 6062, + "ĠGerman": 6063, + ".aw": 6064, + "Adapter": 6065, + "ixel": 6066, + "Ġsystems": 6067, + "Ġdrop": 6068, + "83": 6069, + "Ġstructure": 6070, + "Ġ$(\"#": 6071, + "encies": 6072, + "anning": 6073, + "ĠLink": 6074, + "ĠResponse": 6075, + "Ġstri": 6076, + "ż": 6077, + "ĠDB": 6078, + "æĹ": 6079, + "android": 6080, + "submit": 6081, + "otion": 6082, + "92": 6083, + "(@": 6084, + ".test": 6085, + "82": 6086, + "ĊĊĊĊĊĊĊĊ": 6087, + "];čĊ": 6088, + "Ġdirectly": 6089, + "Ġ\"%": 6090, + "ris": 6091, + "elta": 6092, + "AIL": 6093, + "){čĊ": 6094, + "mine": 6095, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 6096, + "(k": 6097, + "bon": 6098, + "asic": 6099, + "pite": 6100, + "___": 6101, + "Max": 6102, + "Ġerrors": 6103, + "ĠWhile": 6104, + "Ġarguments": 6105, + "Ġensure": 6106, + "Right": 6107, + "-based": 6108, + "Web": 6109, + "Ġ-=": 6110, + "Ġintrodu": 6111, + "ĠInst": 6112, + "ĠWash": 6113, + "ordin": 6114, + "join": 6115, + "Database": 6116, + "Ġgrad": 6117, + "Ġusually": 6118, + "ITE": 6119, + "Props": 6120, + "?>Ċ": 6121, + "ĠGo": 6122, + "@Override": 6123, + "REF": 6124, + "Ġip": 6125, + "ĠAustral": 6126, + "Ġist": 6127, + "ViewById": 6128, + "Ġserious": 6129, + "Ġcustomer": 6130, + ".prototype": 6131, + "odo": 6132, + "cor": 6133, + "Ġdoor": 6134, + "ĠWITHOUT": 6135, + "Ġplant": 6136, + "Ġbegan": 6137, + "Ġdistance": 6138, + "()).": 6139, + "Ġchance": 6140, + "Ġord": 6141, + "came": 6142, + "pragma": 6143, + "Ġprotect": 6144, + "ragment": 6145, + "ĠNode": 6146, + "ening": 6147, + "Ñĩ": 6148, + "Ġroute": 6149, + "ĠSchool": 6150, + "hi": 6151, + "Ġneighb": 6152, + "After": 6153, + "licit": 6154, + "Ġcontr": 6155, + "Ġprimary": 6156, + "AA": 6157, + ".WriteLine": 6158, + "utils": 6159, + "Ġbi": 6160, + "Red": 6161, + ".Linq": 6162, + ".object": 6163, + "Ġleaders": 6164, + "unities": 6165, + "Ġgun": 6166, + "onth": 6167, + "ĠDev": 6168, + "FILE": 6169, + "Ġcomments": 6170, + "_len": 6171, + "arrow": 6172, + "amount": 6173, + "Range": 6174, + "sert": 6175, + "GridView": 6176, + "Ġupdated": 6177, + "ĠMo": 6178, + "Ġinform": 6179, + "ociety": 6180, + "ala": 6181, + "Access": 6182, + "Ġhab": 6183, + "Ġcreat": 6184, + "_arg": 6185, + "ĠJanuary": 6186, + "ĠDay": 6187, + "\")čĊ": 6188, + "uple": 6189, + "document": 6190, + "gorith": 6191, + "menu": 6192, + "ĠOver": 6193, + "bb": 6194, + ".title": 6195, + "_out": 6196, + "Ġled": 6197, + "uri": 6198, + "Ġ?>": 6199, + "gl": 6200, + "Ġbank": 6201, + "ayment": 6202, + "ĉprintf": 6203, + "MD": 6204, + "Ġsample": 6205, + "Ġhands": 6206, + "ĠVersion": 6207, + "uario": 6208, + "Ġoffers": 6209, + "ityEngine": 6210, + "Ġshape": 6211, + "Ġsleep": 6212, + "_point": 6213, + "Settings": 6214, + "Ġachie": 6215, + "Ġsold": 6216, + "ota": 6217, + ".bind": 6218, + "Am": 6219, + "Ġsafe": 6220, + "Store": 6221, + "Ġshared": 6222, + "Ġpriv": 6223, + "_VAL": 6224, + "Ġsens": 6225, + "){": 6226, + "Ġremember": 6227, + "shared": 6228, + "element": 6229, + "Ġshoot": 6230, + "Vert": 6231, + "cout": 6232, + "Ġenv": 6233, + "_label": 6234, + "Ġ>Ċ": 6235, + "run": 6236, + "Ġscene": 6237, + "(array": 6238, + "device": 6239, + "_title": 6240, + "agon": 6241, + "]čĊ": 6242, + "aby": 6243, + "Ġbecame": 6244, + "boolean": 6245, + "Ġpark": 6246, + "ĠCode": 6247, + "upload": 6248, + "riday": 6249, + "ĠSeptember": 6250, + "Fe": 6251, + "Ġsen": 6252, + "cing": 6253, + "FL": 6254, + "Col": 6255, + "uts": 6256, + "_page": 6257, + "inn": 6258, + "Ġimplied": 6259, + "aling": 6260, + "Ġyourself": 6261, + ".Count": 6262, + "conf": 6263, + "Ġaud": 6264, + "_init": 6265, + ".)": 6266, + "Ġwrote": 6267, + "003": 6268, + "NG": 6269, + ".Error": 6270, + "ä»": 6271, + ".for": 6272, + "Ġequal": 6273, + "ĠRequest": 6274, + "Ġserial": 6275, + "Ġallows": 6276, + "XX": 6277, + "Ġmiddle": 6278, + "chor": 6279, + "195": 6280, + "94": 6281, + "ø": 6282, + "erval": 6283, + ".Column": 6284, + "reading": 6285, + "Ġescort": 6286, + "ĠAugust": 6287, + "Ġquickly": 6288, + "Ġweap": 6289, + "ĠCG": 6290, + "ropri": 6291, + "ho": 6292, + "Ġcop": 6293, + "(struct": 6294, + "ĠBig": 6295, + "Ġvs": 6296, + "Ġfrequ": 6297, + ".Value": 6298, + "Ġactions": 6299, + "Ġproper": 6300, + "Ġinn": 6301, + "Ġobjects": 6302, + "Ġmatrix": 6303, + "avascript": 6304, + "Ġones": 6305, + ".group": 6306, + "Ġgreen": 6307, + "Ġpaint": 6308, + "ools": 6309, + "ycl": 6310, + "encode": 6311, + "olt": 6312, + "comment": 6313, + ".api": 6314, + "Dir": 6315, + "Ġune": 6316, + "izont": 6317, + ".position": 6318, + "Ġdesigned": 6319, + "_val": 6320, + "avi": 6321, + "iring": 6322, + "tab": 6323, + "Ġlayer": 6324, + "Ġviews": 6325, + "Ġreve": 6326, + "rael": 6327, + "ĠON": 6328, + "rics": 6329, + "160": 6330, + "np": 6331, + "Ġcore": 6332, + "());čĊ": 6333, + "Main": 6334, + "Ġexpert": 6335, + "ĉĉčĊ": 6336, + "_en": 6337, + "Ġ/>": 6338, + "utter": 6339, + "IAL": 6340, + "ails": 6341, + "ĠKing": 6342, + "*/ĊĊ": 6343, + "ĠMet": 6344, + "_end": 6345, + "addr": 6346, + "ora": 6347, + "Ġir": 6348, + "Min": 6349, + "Ġsurpr": 6350, + "Ġrepe": 6351, + "Ġdirectory": 6352, + "PUT": 6353, + "-S": 6354, + "Ġelection": 6355, + "haps": 6356, + ".pre": 6357, + "cm": 6358, + "Values": 6359, + "Ġ\"Ċ": 6360, + "column": 6361, + "ivil": 6362, + "Login": 6363, + "inue": 6364, + "93": 6365, + "Ġbeautiful": 6366, + "Ġsecret": 6367, + "(event": 6368, + "Ġchat": 6369, + "ums": 6370, + "Ġorigin": 6371, + "Ġeffects": 6372, + "Ġmanagement": 6373, + "illa": 6374, + "tk": 6375, + "Ġsetting": 6376, + "ĠCour": 6377, + "Ġmassage": 6378, + "ĉend": 6379, + "Ġhappy": 6380, + "Ġfinish": 6381, + "Ġcamera": 6382, + "ĠVer": 6383, + "ĠDemocr": 6384, + "ĠHer": 6385, + "(Q": 6386, + "cons": 6387, + "ita": 6388, + "Ġ'.": 6389, + "{}": 6390, + "ĉC": 6391, + "Ġstuff": 6392, + "194": 6393, + "Ġ:Ċ": 6394, + "ĠAR": 6395, + "Task": 6396, + "hidden": 6397, + "eros": 6398, + "IGN": 6399, + "atio": 6400, + "ĠHealth": 6401, + "olute": 6402, + "Enter": 6403, + "'>": 6404, + "ĠTwitter": 6405, + "ĠCounty": 6406, + "scribe": 6407, + "Ġ=>Ċ": 6408, + "Ġhy": 6409, + "fit": 6410, + "Ġmilitary": 6411, + "Ġsale": 6412, + "required": 6413, + "non": 6414, + "bootstrap": 6415, + "hold": 6416, + "rim": 6417, + "-old": 6418, + "ĠDown": 6419, + "Ġmention": 6420, + "contact": 6421, + "_group": 6422, + "oday": 6423, + "Ġtown": 6424, + "Ġsolution": 6425, + "uate": 6426, + "elling": 6427, + "]->": 6428, + "otes": 6429, + "ental": 6430, + "omen": 6431, + "ospital": 6432, + "ĠSup": 6433, + "_EN": 6434, + "Ġslow": 6435, + "SESSION": 6436, + "Ġblue": 6437, + "ago": 6438, + "Ġlives": 6439, + "Ġ^": 6440, + ".un": 6441, + "inst": 6442, + "enge": 6443, + "Ġcustomers": 6444, + "Ġcast": 6445, + "udget": 6446, + "ï¼ģ": 6447, + "icens": 6448, + "Ġdetermin": 6449, + "Selected": 6450, + "_pl": 6451, + "ueue": 6452, + "Ġdark": 6453, + "//ĊĊ": 6454, + "si": 6455, + "thern": 6456, + "ĠJapan": 6457, + "/w": 6458, + "PU": 6459, + "ĠEast": 6460, + "ovie": 6461, + "Ġpackage": 6462, + "Ġnor": 6463, + "Ġapi": 6464, + "bot": 6465, + "\"];Ċ": 6466, + "_post": 6467, + "ulate": 6468, + "Ġclub": 6469, + "'));Ċ": 6470, + "Ġloop": 6471, + "PIO": 6472, + "ione": 6473, + "shot": 6474, + "Initial": 6475, + "Ġplayed": 6476, + "register": 6477, + "rought": 6478, + "_max": 6479, + "acement": 6480, + "match": 6481, + "raphics": 6482, + "AST": 6483, + "Ġexisting": 6484, + "Ġcomplex": 6485, + "DA": 6486, + ".Ch": 6487, + ".common": 6488, + "mo": 6489, + "Ġ'../../": 6490, + "ito": 6491, + "Ġanalysis": 6492, + "Ġdeliver": 6493, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 6494, + "idx": 6495, + "Ãł": 6496, + "ongo": 6497, + "ĠEnglish": 6498, + "Ċ": 10197, + "_default": 10198, + "ĠDatabase": 10199, + "rep": 10200, + "ESS": 10201, + "nergy": 10202, + ".Find": 10203, + "_mask": 10204, + "Ġrise": 10205, + "Ġkernel": 10206, + "::$": 10207, + ".Q": 10208, + "Ġoffering": 10209, + "decl": 10210, + "ĠCS": 10211, + "Ġlisted": 10212, + "Ġmostly": 10213, + "enger": 10214, + "Ġblocks": 10215, + "olo": 10216, + "Ġgoverning": 10217, + "\\F": 10218, + "Ġconcent": 10219, + ".getText": 10220, + "Ġmb": 10221, + "Ġoccurred": 10222, + "Ġchanging": 10223, + "Scene": 10224, + "_CODE": 10225, + "Beh": 10226, + "\"The": 10227, + "Ġtile": 10228, + "ĠAssociation": 10229, + "ĉP": 10230, + "alty": 10231, + "_ad": 10232, + "odies": 10233, + "iated": 10234, + "Ġprepared": 10235, + "possible": 10236, + "Ġmort": 10237, + "TEST": 10238, + "142": 10239, + "Ġignore": 10240, + "Ġcalc": 10241, + "Ġrs": 10242, + "ĠassertEquals": 10243, + "Ġsz": 10244, + "ĠTHIS": 10245, + ".\"Ċ": 10246, + "Ġcanvas": 10247, + "java": 10248, + "Ġdut": 10249, + "VALID": 10250, + ".sql": 10251, + ".input": 10252, + "Ġaux": 10253, + "Sup": 10254, + "Ġartist": 10255, + "Vec": 10256, + "_TIME": 10257, + ".stringify": 10258, + "etween": 10259, + "ĠCategory": 10260, + "Ġ[-": 10261, + "ĠDevExpress": 10262, + "ĠJul": 10263, + "Ġring": 10264, + ".ed": 10265, + "YY": 10266, + "Let": 10267, + "TextField": 10268, + "Ġflat": 10269, + "_print": 10270, + "ĠOTHER": 10271, + "adian": 10272, + "Ġchecked": 10273, + "ele": 10274, + "Align": 10275, + "standing": 10276, + "Ġ[],": 10277, + "Ġlab": 10278, + "ucky": 10279, + "ĠChristmas": 10280, + "(image": 10281, + ".module": 10282, + "Ġlots": 10283, + "Ġslightly": 10284, + "(final": 10285, + "erge": 10286, + "è¿": 10287, + "147": 10288, + "ĠPolice": 10289, + "143": 10290, + "ĠRight": 10291, + "Ġaward": 10292, + "ĠOS": 10293, + "Ġ{}ĊĊ": 10294, + "Ġptr": 10295, + "oves": 10296, + "icated": 10297, + "ем": 10298, + "Ġmanage": 10299, + "oliday": 10300, + "Amount": 10301, + "oolStrip": 10302, + "tbody": 10303, + "Nav": 10304, + "wrap": 10305, + "BB": 10306, + "Ġwatching": 10307, + "arios": 10308, + "Ġoptional": 10309, + "_K": 10310, + "ĠLicensed": 10311, + ".Map": 10312, + "Timer": 10313, + "ĠAP": 10314, + "ĠRev": 10315, + "(o": 10316, + ",c": 10317, + "umin": 10318, + "etailed": 10319, + "ĠHy": 10320, + "Ġblank": 10321, + "agger": 10322, + "ĠSelf": 10323, + "()[": 10324, + ".make": 10325, + "earn": 10326, + "channel": 10327, + ";Ċ": 10342, + "World": 10343, + "Ġpython": 10344, + "Ġlif": 10345, + "Ġtrav": 10346, + "Ġconven": 10347, + "company": 10348, + "ĠClub": 10349, + "138": 10350, + "Ver": 10351, + "Btn": 10352, + "Ġzone": 10353, + "products": 10354, + "ĠEduc": 10355, + "Ġverify": 10356, + "ĠMil": 10357, + "ono": 10358, + "]);ĊĊ": 10359, + "ENCE": 10360, + "Ġpacket": 10361, + "Ġcer": 10362, + "Ġenumer": 10363, + "Ġpars": 10364, + "formed": 10365, + "Ġoccup": 10366, + "tre": 10367, + "Ġexercise": 10368, + "Day": 10369, + "_sum": 10370, + "Ġasking": 10371, + "aption": 10372, + "Ġorders": 10373, + "Ġspending": 10374, + "ĠERR": 10375, + ".Dis": 10376, + "ĠUtil": 10377, + "âĢľI": 10378, + "\\'": 10379, + "?)": 10380, + "/>Ċ": 10381, + "Ġemot": 10382, + "Ġinfluence": 10383, + "ĠAfrica": 10384, + "atters": 10385, + "Ùħ": 10386, + ".session": 10387, + "Ġchief": 10388, + "ĉĉĉĉĉĉĉĉĉĉĉ": 10389, + "Ġtom": 10390, + "cluded": 10391, + "serial": 10392, + "_handler": 10393, + ".Type": 10394, + "aped": 10395, + "Ġpolicies": 10396, + "-ex": 10397, + "-tr": 10398, + "blank": 10399, + "merce": 10400, + "Ġcoverage": 10401, + "Ġrc": 10402, + "_matrix": 10403, + "_box": 10404, + "Ġcharges": 10405, + "ĠBoston": 10406, + "Pe": 10407, + "Ġcircum": 10408, + "Ġfilled": 10409, + "148": 10410, + "Ġnorth": 10411, + "ictureBox": 10412, + "ĉres": 10413, + "è®": 10414, + "Ġtermin": 10415, + "Ġ[âĢ¦": 10416, + "IRECT": 10417, + "Ġber": 10418, + "Ġ\"../../": 10419, + "retch": 10420, + ".code": 10421, + "_col": 10422, + "ĠGovernment": 10423, + "Ġargv": 10424, + "ĠLord": 10425, + "asi": 10426, + "Exec": 10427, + "ĉlet": 10428, + "vertis": 10429, + "Ġdiscussion": 10430, + "enance": 10431, + "outube": 10432, + "typeof": 10433, + "Ġserved": 10434, + "ĠPut": 10435, + "ĉx": 10436, + "Ġsweet": 10437, + "Before": 10438, + "ategy": 10439, + ".of": 10440, + "ĠMaterial": 10441, + "Sort": 10442, + "ONT": 10443, + "igital": 10444, + "Why": 10445, + "Ġsust": 10446, + "Ġç": 10447, + "abet": 10448, + "Ġsegment": 10449, + "Ġ[],Ċ": 10450, + "ĠMuslim": 10451, + "ĠfindViewById": 10452, + "cut": 10453, + "_TEXT": 10454, + "ĠMary": 10455, + "Ġloved": 10456, + "Ġlie": 10457, + "ĠJO": 10458, + "Ġisset": 10459, + "month": 10460, + "Ġprime": 10461, + "ti": 10462, + "ĠCarol": 10463, + "Use": 10464, + "146": 10465, + "ĠPop": 10466, + "ĠSave": 10467, + "Interval": 10468, + "execute": 10469, + "dy": 10470, + "ĠIran": 10471, + "_cont": 10472, + "ĉT": 10473, + "Ġphase": 10474, + "checkbox": 10475, + "week": 10476, + "Ġhide": 10477, + "Ġtil": 10478, + "Ġju": 10479, + "Custom": 10480, + "burg": 10481, + "/M": 10482, + "TON": 10483, + "Ġquant": 10484, + "Ġrub": 10485, + "ixels": 10486, + "Ġinstalled": 10487, + "Ġdump": 10488, + "Ġproperly": 10489, + "(List": 10490, + "Ġdecide": 10491, + "apply": 10492, + "Has": 10493, + "Ġkeeping": 10494, + "Ġcitizens": 10495, + "Ġjoint": 10496, + "pool": 10497, + "Socket": 10498, + "_op": 10499, + "Ġweapon": 10500, + "gnore": 10501, + "ĠExec": 10502, + "otten": 10503, + "ĠMS": 10504, + "Ġ(-": 10505, + "ĠReview": 10506, + "Ġexamples": 10507, + "Ġtight": 10508, + "!(": 10509, + "DP": 10510, + "ĠMessageBox": 10511, + "Ġphotograph": 10512, + "164": 10513, + "URI": 10514, + "ét": 10515, + "low": 10516, + "ĠGrand": 10517, + ".persistence": 10518, + "Ġmaintain": 10519, + "Ġnums": 10520, + "Ġzip": 10521, + "ials": 10522, + "ĠGets": 10523, + "peg": 10524, + "ĠBuffer": 10525, + "~~~~": 10526, + "rastructure": 10527, + "ĠPL": 10528, + "uen": 10529, + "obby": 10530, + "sizeof": 10531, + "Ġpic": 10532, + "Ġseed": 10533, + "Ġexperienced": 10534, + "Ġodd": 10535, + "Ġkick": 10536, + "Ġprocedure": 10537, + "avigator": 10538, + "-on": 10539, + ",j": 10540, + "ĠAlthough": 10541, + "ĠuserId": 10542, + "accept": 10543, + "Blue": 10544, + "IColor": 10545, + "layer": 10546, + "available": 10547, + "Ġends": 10548, + ".table": 10549, + "Ġdataset": 10550, + "bus": 10551, + "Ġexplain": 10552, + "(pro": 10553, + "ĠCommittee": 10554, + "Ġnoted": 10555, + "]:Ċ": 10556, + "Dim": 10557, + "stdio": 10558, + "154": 10559, + ".\",Ċ": 10560, + "_source": 10561, + "181": 10562, + "ĠWeek": 10563, + "ĠEdge": 10564, + "Ġoperating": 10565, + "Ġeste": 10566, + "ipl": 10567, + "330": 10568, + "agination": 10569, + "Ġproceed": 10570, + "Ġanimation": 10571, + ".Models": 10572, + "ĠWatch": 10573, + "iat": 10574, + "Ġoppon": 10575, + "/A": 10576, + "Report": 10577, + "Ġsounds": 10578, + "_buf": 10579, + "IELD": 10580, + "Ġbund": 10581, + "ĉget": 10582, + ".pr": 10583, + "(tmp": 10584, + "Ġkid": 10585, + ">ĊĊĊ": 10586, + "Ġyang": 10587, + "NotFound": 10588, + "ÑĨ": 10589, + "math": 10590, + "@gmail": 10591, + "ĠLIMIT": 10592, + "redients": 10593, + "Ġvent": 10594, + "avigate": 10595, + "Look": 10596, + "Ġreligious": 10597, + "Ġrand": 10598, + "rio": 10599, + "(GL": 10600, + "_ip": 10601, + "uan": 10602, + "iciency": 10603, + "ĠChange": 10604, + ">čĊčĊ": 10605, + "ĠEntity": 10606, + "Ġrencontre": 10607, + "ĠRet": 10608, + "plan": 10609, + "én": 10610, + "BOOL": 10611, + "uries": 10612, + "train": 10613, + "Definition": 10614, + "============": 10615, + "zz": 10616, + "450": 10617, + "Animation": 10618, + "ĠOK": 10619, + "_menu": 10620, + ".bl": 10621, + "_score": 10622, + "Ġacad": 10623, + "(System": 10624, + "Ġrefresh": 10625, + "'=>$": 10626, + ".Graphics": 10627, + "amento": 10628, + "pid": 10629, + "tc": 10630, + "Ġtips": 10631, + "Ġhomes": 10632, + "Ġfuel": 10633, + "âĸ": 10634, + "_helper": 10635, + "ĠĠčĊ": 10636, + "ĠRoom": 10637, + ".Close": 10638, + "_attr": 10639, + "ĠMount": 10640, + "ĠEv": 10641, + "arser": 10642, + "_top": 10643, + "eah": 10644, + "ĠDelete": 10645, + "ãĢį": 10646, + "uke": 10647, + "Ġusage": 10648, + "aria": 10649, + "_dev": 10650, + "Ġtexture": 10651, + "Ġconversation": 10652, + "eper": 10653, + "Bean": 10654, + "done": 10655, + "nonatomic": 10656, + "ĠSecond": 10657, + "Ġshooting": 10658, + "_pre": 10659, + "Components": 10660, + "Ġ]ĊĊ": 10661, + "__,": 10662, + "stitution": 10663, + ".Char": 10664, + ">();ĊĊ": 10665, + "Ġpresented": 10666, + "Ġwa": 10667, + "oker": 10668, + "-ĊĊ": 10669, + "iner": 10670, + "Ġbecoming": 10671, + "Ġincident": 10672, + "Att": 10673, + "162": 10674, + "Ġrevealed": 10675, + "forc": 10676, + "Ġboot": 10677, + ".page": 10678, + "Enumerator": 10679, + "165": 10680, + "_->": 10681, + "Photo": 10682, + "Ġspring": 10683, + ".\",": 10684, + "ĠDictionary": 10685, + "BJECT": 10686, + "Ġlocations": 10687, + "Ġsamples": 10688, + "InputStream": 10689, + "ĠBrown": 10690, + "Ġstats": 10691, + "quality": 10692, + "Ñħ": 10693, + "-dis": 10694, + "Ġhelping": 10695, + "Ġped": 10696, + "224": 10697, + "(se": 10698, + "ĠWho": 10699, + "alian": 10700, + "internal": 10701, + "Ġft": 10702, + ">().": 10703, + "->{": 10704, + "Ġmine": 10705, + "Ġsector": 10706, + "Ġgro": 10707, + "Ġopportunities": 10708, + "Ġü": 10709, + "Ġmp": 10710, + "Ġalleged": 10711, + "Ġdoubt": 10712, + "Mouse": 10713, + "About": 10714, + "_part": 10715, + "Ġchair": 10716, + "Ġstopped": 10717, + "161": 10718, + "loop": 10719, + "entities": 10720, + "Ġapps": 10721, + "ansion": 10722, + "Ġmental": 10723, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10724, + "FR": 10725, + "Ġdefend": 10726, + "care": 10727, + "Ġideal": 10728, + "/api": 10729, + "urface": 10730, + "011": 10731, + "Ġele": 10732, + "ulator": 10733, + "ĠRights": 10734, + "anguages": 10735, + "Ġfunds": 10736, + "Ġadapt": 10737, + "Attributes": 10738, + "Ġdeploy": 10739, + "opts": 10740, + "Ġvalidation": 10741, + "Ġconcerns": 10742, + "uce": 10743, + ".num": 10744, + "ulture": 10745, + "ila": 10746, + "Ġcup": 10747, + "Ġpure": 10748, + ".Fore": 10749, + "183": 10750, + "ĠHashMap": 10751, + ".valueOf": 10752, + "asm": 10753, + "MO": 10754, + "Ġcs": 10755, + "Ġstores": 10756, + "Ġ************************************************************************": 10757, + "Ġcommunication": 10758, + "mem": 10759, + ".EventHandler": 10760, + ".Status": 10761, + "_right": 10762, + ".setOn": 10763, + "Sheet": 10764, + "Ġidentify": 10765, + "enerated": 10766, + "ordered": 10767, + "Ġ\"[": 10768, + "Ġswe": 10769, + "Condition": 10770, + "ĠAccording": 10771, + "Ġprepare": 10772, + "Ġrob": 10773, + "Pool": 10774, + "Ġsport": 10775, + "rv": 10776, + "ĠRouter": 10777, + "Ġalternative": 10778, + "([]": 10779, + "ĠChicago": 10780, + "ipher": 10781, + "ische": 10782, + "ĠDirector": 10783, + "kl": 10784, + "ĠWil": 10785, + "keys": 10786, + "Ġmysql": 10787, + "Ġwelcome": 10788, + "king": 10789, + "ĠManager": 10790, + "Ġcaught": 10791, + ")}Ċ": 10792, + "Score": 10793, + "_PR": 10794, + "Ġsurvey": 10795, + "hab": 10796, + "Headers": 10797, + "ADER": 10798, + "Ġdecor": 10799, + "Ġturns": 10800, + "Ġradius": 10801, + "errupt": 10802, + "Cor": 10803, + "Ġmel": 10804, + "Ġintr": 10805, + "(q": 10806, + "ĠAC": 10807, + "amos": 10808, + "MAX": 10809, + "ĠGrid": 10810, + "ĠJesus": 10811, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10812, + ".DE": 10813, + "Ġts": 10814, + "Ġlinked": 10815, + "free": 10816, + "ĠQt": 10817, + "Ġ/**čĊ": 10818, + "Ġfaster": 10819, + "ctr": 10820, + "_J": 10821, + "DT": 10822, + ".Check": 10823, + "Ġcombination": 10824, + "Ġintended": 10825, + "-the": 10826, + "-type": 10827, + "182": 10828, + "ectors": 10829, + "ami": 10830, + "uting": 10831, + "Ġuma": 10832, + "XML": 10833, + "UCT": 10834, + "Ap": 10835, + "ĠRandom": 10836, + "Ġran": 10837, + ".sort": 10838, + "Ġsorted": 10839, + ".Un": 10840, + "401": 10841, + "_PER": 10842, + "itory": 10843, + "Ġpriority": 10844, + "ĠGal": 10845, + "ĠOld": 10846, + "hot": 10847, + "ĠDisplay": 10848, + "(sub": 10849, + "_TH": 10850, + "_Y": 10851, + "ĠCare": 10852, + "loading": 10853, + "Kind": 10854, + "_handle": 10855, + ",,": 10856, + "rase": 10857, + "_replace": 10858, + ".addEventListener": 10859, + "ĠRT": 10860, + "172": 10861, + "Ġentered": 10862, + "gers": 10863, + "Ġich": 10864, + "(start": 10865, + "205": 10866, + "/app": 10867, + "Ġbrother": 10868, + "Memory": 10869, + "Outlet": 10870, + "Ġutf": 10871, + "prec": 10872, + "Ġnavigation": 10873, + "ORK": 10874, + "Ġdst": 10875, + "Detail": 10876, + "Ġaudience": 10877, + "Ġdur": 10878, + "Ġcluster": 10879, + "unched": 10880, + "Ġ],": 10881, + "Ġcomfortable": 10882, + ".values": 10883, + "ĠTotal": 10884, + "Ġsnap": 10885, + "Ġstandards": 10886, + "Ġperformed": 10887, + "hand": 10888, + "(\"@": 10889, + "åŃ": 10890, + "Ġphil": 10891, + "ibr": 10892, + "trim": 10893, + "Ġforget": 10894, + "157": 10895, + "Ġdoctor": 10896, + ".TextBox": 10897, + "377": 10898, + "icons": 10899, + ",s": 10900, + "ĠOp": 10901, + "Sm": 10902, + "Stop": 10903, + "ĉList": 10904, + "ĉu": 10905, + "Comment": 10906, + "_VERSION": 10907, + ".Xtra": 10908, + "Person": 10909, + "rb": 10910, + "LOB": 10911, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 10912, + "ĠCentral": 10913, + "270": 10914, + "ICK": 10915, + "raq": 10916, + "Ġputting": 10917, + "Ġmd": 10918, + "ĠLove": 10919, + "Program": 10920, + "Border": 10921, + "oor": 10922, + "Ġallowing": 10923, + "after": 10924, + "Ġentries": 10925, + "ĠMaybe": 10926, + "]).": 10927, + "ĠShort": 10928, + ")\\": 10929, + ".now": 10930, + "friend": 10931, + "Ġprefer": 10932, + "ĠGPIO": 10933, + "osis": 10934, + "ĠGameObject": 10935, + "Ġskip": 10936, + "Ġcompetition": 10937, + "_match": 10938, + "lications": 10939, + "_CONT": 10940, + ".groupBox": 10941, + "Ġals": 10942, + "666": 10943, + "\"We": 10944, + "_eq": 10945, + "lan": 10946, + "_search": 10947, + "ĠMusic": 10948, + "asis": 10949, + "Ġbind": 10950, + "ĠIsland": 10951, + "rum": 10952, + "(E": 10953, + "Ġseat": 10954, + "Video": 10955, + "Ġack": 10956, + "reek": 10957, + "={()": 10958, + "Ġrating": 10959, + "Ġrestaurant": 10960, + "456": 10961, + "DEX": 10962, + "(buf": 10963, + "pping": 10964, + "uality": 10965, + "Ġleague": 10966, + "176": 10967, + "Ġfocused": 10968, + "apon": 10969, + "$data": 10970, + "CLUD": 10971, + "CLUDING": 10972, + "Ġabsolute": 10973, + "(query": 10974, + "Ġtells": 10975, + "Ang": 10976, + "Ġcommunities": 10977, + "Ġhonest": 10978, + "oking": 10979, + "Ġapart": 10980, + "arity": 10981, + "/$": 10982, + "_module": 10983, + "ĠEnc": 10984, + ".an": 10985, + ".Config": 10986, + "Cre": 10987, + "Ġshock": 10988, + "ĠArab": 10989, + "IENT": 10990, + "/re": 10991, + "Ġretrie": 10992, + "ycler": 10993, + "isa": 10994, + "ĠOrgan": 10995, + ".graph": 10996, + "Ġí": 10997, + "ĠBAS": 10998, + "Enum": 10999, + "Ġpossibly": 11000, + "ÑĢаÐ": 11001, + "ĠJapanese": 11002, + "Ġcraft": 11003, + "ĠPlace": 11004, + "Ġtalent": 11005, + "Ġfunding": 11006, + "Ġconfirmed": 11007, + "Ġcycle": 11008, + "/x": 11009, + "GE": 11010, + "Ġhearing": 11011, + "Ġplants": 11012, + "Ġmouth": 11013, + "pages": 11014, + "oria": 11015, + "ĠRemove": 11016, + "_total": 11017, + "Ġod": 11018, + "ollapse": 11019, + "door": 11020, + "Ġbought": 11021, + "Ġaddr": 11022, + "ARCH": 11023, + "_dim": 11024, + "dden": 11025, + "Ġdecades": 11026, + "REQUEST": 11027, + "Ġversions": 11028, + "fire": 11029, + "006": 11030, + "Ġmoves": 11031, + "fb": 11032, + "Ġcoffee": 11033, + ".connect": 11034, + "ĠRow": 11035, + "Ġschema": 11036, + "Scope": 11037, + "-Type": 11038, + "Ġfighting": 11039, + "Ġretail": 11040, + "Ġmodified": 11041, + "TF": 11042, + "Files": 11043, + "nie": 11044, + "_command": 11045, + "stone": 11046, + "ĠÑĤ": 11047, + "_thread": 11048, + "Ġbond": 11049, + "ĠDevelopment": 11050, + "Ġpt": 11051, + "FORM": 11052, + "plet": 11053, + "Ġidentified": 11054, + "cpp": 11055, + "206": 11056, + "225": 11057, + "Ġcoding": 11058, + "oked": 11059, + "ĠMaster": 11060, + "IDTH": 11061, + "Ġresidents": 11062, + "redit": 11063, + "ĠPhoto": 11064, + "=-": 11065, + "unte": 11066, + "ateur": 11067, + "159": 11068, + "_STATE": 11069, + "ĠSing": 11070, + "Ġsheet": 11071, + ".val": 11072, + "orse": 11073, + "Ġhers": 11074, + "Ġdetermined": 11075, + "Common": 11076, + "Ġwed": 11077, + "_queue": 11078, + "PH": 11079, + "ĠAtl": 11080, + "cred": 11081, + "/LICENSE": 11082, + "Ġmes": 11083, + "Ġadvanced": 11084, + ".java": 11085, + ".Sh": 11086, + "Go": 11087, + "kill": 11088, + "fp": 11089, + "_settings": 11090, + "Ġpal": 11091, + "Ġtruck": 11092, + "Ġcombined": 11093, + "Ġ\"${": 11094, + "ĠCorpor": 11095, + "Ġjoined": 11096, + "ĠJose": 11097, + "ĠCup": 11098, + "uns": 11099, + "estival": 11100, + "levision": 11101, + "Ġbroken": 11102, + "Ġmarriage": 11103, + "ĠWestern": 11104, + "Ġrepresents": 11105, + "ĠTitle": 11106, + "Ġss": 11107, + ".Ass": 11108, + "ongoose": 11109, + "iento": 11110, + "<>();Ċ": 11111, + "Ġabsolutely": 11112, + "Ġsmooth": 11113, + "TERN": 11114, + "ĠUnless": 11115, + "Word": 11116, + "Ġmerge": 11117, + "igan": 11118, + "ĠVol": 11119, + "Ġnn": 11120, + ".getId": 11121, + "Ġз": 11122, + "171": 11123, + "Ġsexy": 11124, + "Ġseeking": 11125, + "Single": 11126, + ".this": 11127, + "179": 11128, + "Ġkom": 11129, + "bound": 11130, + ";\"": 11131, + "ĠfontSize": 11132, + "_df": 11133, + "Ġinjury": 11134, + "(H": 11135, + "Ġissued": 11136, + "_END": 11137, + ":self": 11138, + "020": 11139, + "Ġpatch": 11140, + "Ġleaves": 11141, + "Ġadopt": 11142, + "FileName": 11143, + "ãĢIJ": 11144, + "Ġexecutive": 11145, + "ĠByte": 11146, + "]))Ċ": 11147, + "Ġnu": 11148, + "outing": 11149, + "cluding": 11150, + "-R": 11151, + ".options": 11152, + "Ġsubstant": 11153, + "avax": 11154, + "ĠBUT": 11155, + "Ġtechnical": 11156, + "Ġtwice": 11157, + "Ġmás": 11158, + "Ġunivers": 11159, + "yr": 11160, + "Ġdrag": 11161, + "ĠDC": 11162, + "Ġsed": 11163, + "Ġbot": 11164, + "ĠPal": 11165, + "ĠHall": 11166, + "forcement": 11167, + "Ġauch": 11168, + ".mod": 11169, + "notation": 11170, + "_files": 11171, + ".line": 11172, + "_flag": 11173, + "[name": 11174, + "Ġresolution": 11175, + "Ġbott": 11176, + "(\"[": 11177, + "ende": 11178, + "(arr": 11179, + "Free": 11180, + "(@\"": 11181, + "ĠDistrict": 11182, + "PEC": 11183, + ":-": 11184, + "Picker": 11185, + "ĠJo": 11186, + "ĠĠĠĠĠĊ": 11187, + "ĠRiver": 11188, + "_rows": 11189, + "Ġhelpful": 11190, + "Ġmassive": 11191, + "---Ċ": 11192, + "Ġmeasures": 11193, + "007": 11194, + "ĠRuntime": 11195, + "Ġworry": 11196, + "ĠSpec": 11197, + "ĉD": 11198, + "ãĢij": 11199, + "Ġ){Ċ": 11200, + "Ġworse": 11201, + "(filename": 11202, + "Ġlay": 11203, + "Ġmagic": 11204, + "ĠTheir": 11205, + "oul": 11206, + "stroy": 11207, + "ĠWhere": 11208, + "280": 11209, + "Ġsudden": 11210, + "Ġdefe": 11211, + "Ġbinding": 11212, + "Ġflight": 11213, + "ĠOnInit": 11214, + "ĠWomen": 11215, + "ĠPolicy": 11216, + "Ġdrugs": 11217, + "ishing": 11218, + "('../": 11219, + "ĠMel": 11220, + "peat": 11221, + "tor": 11222, + "Ġproposed": 11223, + "Ġstated": 11224, + "_RES": 11225, + "Ġeast": 11226, + "212": 11227, + "ĠCONDITION": 11228, + "_desc": 11229, + "Ġwinning": 11230, + "folio": 11231, + "Mapper": 11232, + "ĠPan": 11233, + "ĠAnge": 11234, + ".servlet": 11235, + "Ġcopies": 11236, + "LM": 11237, + "Ġvm": 11238, + "åį": 11239, + "Ġdictionary": 11240, + "Seg": 11241, + "177": 11242, + "elines": 11243, + "ĠSend": 11244, + "Ġiron": 11245, + "ĠFort": 11246, + "166": 11247, + ".domain": 11248, + "Ġdebate": 11249, + "NotNull": 11250, + "eq": 11251, + "acher": 11252, + "lf": 11253, + "ĉfmt": 11254, + "Ġlawy": 11255, + "178": 11256, + "ÄŁ": 11257, + "ĠMen": 11258, + "Ġtrim": 11259, + "(NULL": 11260, + "Ġ!!": 11261, + "Ġpad": 11262, + "Ġfollows": 11263, + "\"][\"": 11264, + "requ": 11265, + "ĠEp": 11266, + ".github": 11267, + "(img": 11268, + "eto": 11269, + "('\\": 11270, + "Services": 11271, + "umbnail": 11272, + "_main": 11273, + "pleted": 11274, + "fortunately": 11275, + "Ġwindows": 11276, + "Ġplane": 11277, + "ĠConnection": 11278, + ".local": 11279, + "uard": 11280, + "}\\": 11281, + "==\"": 11282, + "andon": 11283, + "ĠRoy": 11284, + "west": 11285, + "158": 11286, + "iginal": 11287, + "emies": 11288, + "itz": 11289, + "'):Ċ": 11290, + "ĠPeter": 11291, + "Ġtough": 11292, + "Ġreduced": 11293, + "Ġcalculate": 11294, + "Ġrapid": 11295, + "customer": 11296, + "Ġefficient": 11297, + "Ġmedium": 11298, + "Ġfell": 11299, + ".ref": 11300, + "ĠCas": 11301, + "Ġfeedback": 11302, + "Speed": 11303, + "(output": 11304, + "aje": 11305, + "Ġcategories": 11306, + "Ġfee": 11307, + "};": 11308, + "Ġdeleted": 11309, + "reh": 11310, + "Ġproof": 11311, + "Desc": 11312, + "Build": 11313, + "Ġsides": 11314, + ".ArrayList": 11315, + "-%": 11316, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 11317, + "ر": 11318, + ".match": 11319, + "ли": 11320, + "Ġfeels": 11321, + "Ġachieve": 11322, + "Ġclim": 11323, + "_ON": 11324, + "ĠCD": 11325, + "Ġteacher": 11326, + "_current": 11327, + "bn": 11328, + "_PL": 11329, + "isting": 11330, + "Enable": 11331, + "GEN": 11332, + "Ġtv": 11333, + "Ġsock": 11334, + "Ġplays": 11335, + "Ġdiscount": 11336, + "ĠKE": 11337, + "ĠDebug": 11338, + "Fore": 11339, + "ĠIraq": 11340, + "Ġappearance": 11341, + "Mon": 11342, + "Ġstyled": 11343, + "ĠHuman": 11344, + "iot": 11345, + "ĠHistory": 11346, + "Ġsac": 11347, + "ĠCollection": 11348, + "Ġrecommended": 11349, + ".Selected": 11350, + "Ġorganizations": 11351, + "Ġdiscovered": 11352, + "cohol": 11353, + "adas": 11354, + "ĠThomas": 11355, + "May": 11356, + "Ġconserv": 11357, + "Ġdomin": 11358, + "ĠFollow": 11359, + "ĠSection": 11360, + "ĠThanks": 11361, + "Username": 11362, + "Ġrecipe": 11363, + "Ġwonderful": 11364, + ".sleep": 11365, + "_if": 11366, + "ĉĊĉĊ": 11367, + "orno": 11368, + "Ġru": 11369, + "_target": 11370, + ".\"\"": 11371, + "à¦": 11372, + "EventArgs": 11373, + "Ġinputs": 11374, + "Ġfif": 11375, + "Ġvision": 11376, + "cy": 11377, + "ĠSeries": 11378, + ")(((": 11379, + "Ġtrading": 11380, + "Ġmarker": 11381, + "Begin": 11382, + "Ġtypically": 11383, + "Ġcauses": 11384, + "dropdown": 11385, + "_DEBUG": 11386, + "260": 11387, + "Ġdetect": 11388, + "country": 11389, + "!\");Ċ": 11390, + "ĉR": 11391, + "appy": 11392, + "Ġcref": 11393, + "('<": 11394, + "\"=>": 11395, + "ĠLE": 11396, + "reader": 11397, + "Ġadministr": 11398, + "õ": 11399, + "ucket": 11400, + "Ġfashion": 11401, + ".char": 11402, + "izar": 11403, + "Ġdisable": 11404, + "Ġsuc": 11405, + "ĠLive": 11406, + "issue": 11407, + "Ġmetadata": 11408, + "flags": 11409, + "ĠðŁ": 11410, + "Ġcommitted": 11411, + "Ġva": 11412, + "Ġrough": 11413, + "Ġ'''Ċ": 11414, + "Ġhighlight": 11415, + "_vars": 11416, + "VO": 11417, + "Ġencoding": 11418, + "-Z": 11419, + "_sign": 11420, + "$(\"#": 11421, + "Ġrain": 11422, + "reatest": 11423, + "ĠEND": 11424, + "Selection": 11425, + "Ġcandidates": 11426, + "Ġsav": 11427, + ".Empty": 11428, + "Ġdecisions": 11429, + "Ġcollabor": 11430, + "ridge": 11431, + "feed": 11432, + "ression": 11433, + "Ġpersons": 11434, + "VM": 11435, + "008": 11436, + "ega": 11437, + "_BIT": 11438, + "According": 11439, + "acked": 11440, + "Ġdollars": 11441, + "_loss": 11442, + "ĠCost": 11443, + "}\"Ċ": 11444, + "Notification": 11445, + "Ġprostit": 11446, + "Ġauthority": 11447, + ".rec": 11448, + "Ġspokes": 11449, + "ĠToday": 11450, + "istant": 11451, + "ĠHead": 11452, + "âĢĿ.": 11453, + "ertainment": 11454, + "cean": 11455, + "culate": 11456, + "Ġven": 11457, + "However": 11458, + "_arr": 11459, + "Ġtokens": 11460, + "Graph": 11461, + "ĠJud": 11462, + "ĠVirgin": 11463, + "ĠSerial": 11464, + "unning": 11465, + "Mutable": 11466, + "agers": 11467, + ".csv": 11468, + "Ġdeveloping": 11469, + "Ġinstructions": 11470, + "Ġpromise": 11471, + "Ġrequested": 11472, + "_encode": 11473, + "/\"": 11474, + "ĠIcon": 11475, + "uilt": 11476, + "-day": 11477, + "Ġintelligence": 11478, + ".IS": 11479, + "ĠObservable": 11480, + "ĠHard": 11481, + "Bool": 11482, + "211": 11483, + "idential": 11484, + ".Anchor": 11485, + "Ġselling": 11486, + "CI": 11487, + "AGES": 11488, + "tle": 11489, + "bur": 11490, + "UFFER": 11491, + "RY": 11492, + "Ġbigger": 11493, + "Ġrat": 11494, + "Ġfamous": 11495, + "Ġtypename": 11496, + "Ġexplained": 11497, + "}}Ċ": 11498, + "Ġnuclear": 11499, + "-N": 11500, + "Ġcrisis": 11501, + "ĠEnter": 11502, + "Ġanswers": 11503, + "/${": 11504, + "/pl": 11505, + "Ġsequ": 11506, + "_next": 11507, + "mask": 11508, + "Ġstanding": 11509, + "Ġplenty": 11510, + "ĠCross": 11511, + "ĉret": 11512, + "dro": 11513, + "ĠCast": 11514, + "167": 11515, + "=true": 11516, + "ĠChris": 11517, + "icio": 11518, + "ĠMike": 11519, + "Decimal": 11520, + "addComponent": 11521, + "Len": 11522, + "Ġcock": 11523, + "Ġ#{": 11524, + "URN": 11525, + "": 11657, + "Ġ*=": 11658, + "ĠPS": 11659, + "Ġdangerous": 11660, + "[p": 11661, + "OME": 11662, + "Other": 11663, + "ĠStringBuilder": 11664, + "Points": 11665, + "heading": 11666, + "Ġcurrency": 11667, + "Ġpercentage": 11668, + "_API": 11669, + "Ġclassic": 11670, + "thead": 11671, + "ĠMO": 11672, + "FE": 11673, + "Idx": 11674, + "await": 11675, + "Ġè": 11676, + "Ġaccident": 11677, + "Ġvariant": 11678, + "Ġmyst": 11679, + "ĠLand": 11680, + "ĠBre": 11681, + "Ġharm": 11682, + "ĠAcc": 11683, + "Ġcharged": 11684, + "iones": 11685, + "Visibility": 11686, + "arry": 11687, + "ĠLanguage": 11688, + "Ġwalking": 11689, + "\".ĊĊ": 11690, + "ifer": 11691, + "Ġleadership": 11692, + ".From": 11693, + "ynam": 11694, + "Ġtimestamp": 11695, + "ipt": 11696, + "ĠHas": 11697, + "REFER": 11698, + "ĠIts": 11699, + "Ġlistener": 11700, + "UTE": 11701, + "213": 11702, + "_description": 11703, + "Ġexperiences": 11704, + "Ġcreates": 11705, + "RS": 11706, + "cart": 11707, + "black": 11708, + "Ġchoices": 11709, + "war": 11710, + "750": 11711, + "Ġ'''": 11712, + "Ġordered": 11713, + "Ġevening": 11714, + "Ġpil": 11715, + "Ġtun": 11716, + "ĠBad": 11717, + "(app": 11718, + "random": 11719, + "Ġexplicit": 11720, + "Ġarrived": 11721, + "Ġfly": 11722, + "Ġeconom": 11723, + "-mail": 11724, + "Ġlists": 11725, + "Ġarchitect": 11726, + "234": 11727, + "ĠPay": 11728, + "Ġds": 11729, + "ĠSol": 11730, + "Ġvehicles": 11731, + "Hz": 11732, + "-com": 11733, + "Ġking": 11734, + "_equal": 11735, + "ĠHelp": 11736, + "Ġabuse": 11737, + "480": 11738, + "169": 11739, + "--;Ċ": 11740, + "Ġextr": 11741, + "Ġchemical": 11742, + "ä¿": 11743, + "Ġorient": 11744, + "Ġbreath": 11745, + "ĠSpace": 11746, + "(element": 11747, + "wait": 11748, + "DED": 11749, + "igma": 11750, + "Ġentr": 11751, + "Ġsob": 11752, + "-name": 11753, + "Ġaffected": 11754, + "ika": 11755, + "Ġcoal": 11756, + "_work": 11757, + "Ġhundreds": 11758, + "Ġpolitics": 11759, + "subject": 11760, + "Ġconsumer": 11761, + "ANGE": 11762, + "Ġrepeated": 11763, + "Send": 11764, + "Ġ#[": 11765, + "Ġprotocol": 11766, + "Ġleads": 11767, + "useum": 11768, + "Every": 11769, + "808": 11770, + "174": 11771, + "Import": 11772, + "(count": 11773, + "Ġchallenges": 11774, + "Ġnovel": 11775, + "Ġdepart": 11776, + "bits": 11777, + ".Current": 11778, + "Ġ`${": 11779, + "oting": 11780, + "(\\": 11781, + "Ġcreative": 11782, + "Ġbuff": 11783, + "Ġintroduced": 11784, + "usic": 11785, + "modules": 11786, + "Are": 11787, + "-doc": 11788, + "language": 11789, + "_cache": 11790, + "Ġtod": 11791, + "?>": 11792, + "omething": 11793, + "Ġhun": 11794, + "åº": 11795, + "aters": 11796, + "Intent": 11797, + "Ġimplemented": 11798, + "ĠCase": 11799, + "Children": 11800, + "Ġnotification": 11801, + "Renderer": 11802, + "Wrapper": 11803, + "Objects": 11804, + "tl": 11805, + ".Contains": 11806, + "Plugin": 11807, + ".row": 11808, + "Ġforg": 11809, + "Ġpermit": 11810, + "Ġtargets": 11811, + "ĠIF": 11812, + "Ġtip": 11813, + "sex": 11814, + "Ġsupports": 11815, + "Ġfold": 11816, + "photo": 11817, + "},čĊ": 11818, + "Ġgoogle": 11819, + "$('#": 11820, + "Ġsharing": 11821, + "Ġgoods": 11822, + "vs": 11823, + "ĠDan": 11824, + "Rate": 11825, + "ĠMartin": 11826, + "Ġmanner": 11827, + "lie": 11828, + ".The": 11829, + "Internal": 11830, + "ĠCONTR": 11831, + "Mock": 11832, + "RIGHT": 11833, + "Ġ'{": 11834, + "Ġcontrols": 11835, + "Mat": 11836, + "Ġmand": 11837, + "Ġextended": 11838, + "Ok": 11839, + "Ġembed": 11840, + "Ġplanet": 11841, + "ĠNon": 11842, + "-ch": 11843, + ")\",": 11844, + "epar": 11845, + "Ġbelieved": 11846, + "ĠEnvironment": 11847, + "ĠFriend": 11848, + "-res": 11849, + "Ġhandling": 11850, + "nic": 11851, + "-level": 11852, + "scri": 11853, + "Xml": 11854, + "BE": 11855, + "ungen": 11856, + "Ġalter": 11857, + "[idx": 11858, + "Pop": 11859, + "cam": 11860, + "Ġ(((": 11861, + "Ġshipping": 11862, + "Ġbattery": 11863, + "iddleware": 11864, + "MC": 11865, + "Ġimpl": 11866, + "otation": 11867, + "ĠLab": 11868, + "