qwen-2-q0f16-MLC / ndarray-cache.json
geonmin-kim's picture
Upload folder using huggingface_hub
7bed016 verified
{
"metadata": {
"ParamSize": 31,
"ParamBytes": 3821161472.0,
"BitsPerParam": 16.0
},
"records": [
{
"dataPath": "params_shard_0.bin",
"format": "raw-shard",
"nbytes": 978345984,
"records": [
{
"name": "lm_head.weight",
"shape": [
136488,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 978345984,
"byteOffset": 0
}
],
"md5sum": "f24bc2a390a565ec24307333d9aa9b5b"
},
{
"dataPath": "params_shard_1.bin",
"format": "raw-shard",
"nbytes": 135790592,
"records": [
{
"name": "model.layers.3.mlp.down_proj.weight",
"shape": [
3584,
18944
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 135790592,
"byteOffset": 0
}
],
"md5sum": "8463225b5d39d8aa6befc7e394ff9a80"
},
{
"dataPath": "params_shard_2.bin",
"format": "raw-shard",
"nbytes": 271581184,
"records": [
{
"name": "model.layers.3.mlp.gate_up_proj.weight",
"shape": [
37888,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 271581184,
"byteOffset": 0
}
],
"md5sum": "ce9430ea30508f4c11646d9f6987c7d5"
},
{
"dataPath": "params_shard_3.bin",
"format": "raw-shard",
"nbytes": 978345984,
"records": [
{
"name": "model.embed_tokens.weight",
"shape": [
136488,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 978345984,
"byteOffset": 0
}
],
"md5sum": "2034469190648e591720406f8f5d6931"
},
{
"dataPath": "params_shard_4.bin",
"format": "raw-shard",
"nbytes": 135790592,
"records": [
{
"name": "model.layers.0.mlp.down_proj.weight",
"shape": [
3584,
18944
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 135790592,
"byteOffset": 0
}
],
"md5sum": "d8c5636ba8c54a1bf9a9be52028edd24"
},
{
"dataPath": "params_shard_5.bin",
"format": "raw-shard",
"nbytes": 271581184,
"records": [
{
"name": "model.layers.0.mlp.gate_up_proj.weight",
"shape": [
37888,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 271581184,
"byteOffset": 0
}
],
"md5sum": "eab8149d005afce177602e3a0502e2d5"
},
{
"dataPath": "params_shard_6.bin",
"format": "raw-shard",
"nbytes": 25690112,
"records": [
{
"name": "model.layers.0.self_attn.o_proj.weight",
"shape": [
3584,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 25690112,
"byteOffset": 0
}
],
"md5sum": "23278f4c2c2bd26e27c57bf98ad4ef8c"
},
{
"dataPath": "params_shard_7.bin",
"format": "raw-shard",
"nbytes": 135790592,
"records": [
{
"name": "model.layers.1.mlp.down_proj.weight",
"shape": [
3584,
18944
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 135790592,
"byteOffset": 0
}
],
"md5sum": "ccb811f73867d1f386520f524f2c01a2"
},
{
"dataPath": "params_shard_8.bin",
"format": "raw-shard",
"nbytes": 271581184,
"records": [
{
"name": "model.layers.1.mlp.gate_up_proj.weight",
"shape": [
37888,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 271581184,
"byteOffset": 0
}
],
"md5sum": "92a7bea5fcddf575091c43b1c4df714c"
},
{
"dataPath": "params_shard_9.bin",
"format": "raw-shard",
"nbytes": 33030144,
"records": [
{
"name": "model.layers.1.self_attn.c_attn.weight",
"shape": [
4608,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 33030144,
"byteOffset": 0
}
],
"md5sum": "c03154c2e7e28390bd1554a72a582034"
},
{
"dataPath": "params_shard_10.bin",
"format": "raw-shard",
"nbytes": 25690112,
"records": [
{
"name": "model.layers.1.self_attn.o_proj.weight",
"shape": [
3584,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 25690112,
"byteOffset": 0
}
],
"md5sum": "d46398b81504bd2d82830108afdd8407"
},
{
"dataPath": "params_shard_11.bin",
"format": "raw-shard",
"nbytes": 135790592,
"records": [
{
"name": "model.layers.2.mlp.down_proj.weight",
"shape": [
3584,
18944
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 135790592,
"byteOffset": 0
}
],
"md5sum": "dd79708597c0102a78c1c7487114aafe"
},
{
"dataPath": "params_shard_12.bin",
"format": "raw-shard",
"nbytes": 271581184,
"records": [
{
"name": "model.layers.2.mlp.gate_up_proj.weight",
"shape": [
37888,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 271581184,
"byteOffset": 0
}
],
"md5sum": "56b5611e7e548cbe8da292871a122b53"
},
{
"dataPath": "params_shard_13.bin",
"format": "raw-shard",
"nbytes": 33030144,
"records": [
{
"name": "model.layers.2.self_attn.c_attn.weight",
"shape": [
4608,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 33030144,
"byteOffset": 0
}
],
"md5sum": "8af6d905b41911171901c0c9b1309afb"
},
{
"dataPath": "params_shard_14.bin",
"format": "raw-shard",
"nbytes": 25690112,
"records": [
{
"name": "model.layers.2.self_attn.o_proj.weight",
"shape": [
3584,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 25690112,
"byteOffset": 0
}
],
"md5sum": "126e17f7b67d299092e34621d3d01ba5"
},
{
"dataPath": "params_shard_15.bin",
"format": "raw-shard",
"nbytes": 33030144,
"records": [
{
"name": "model.layers.3.self_attn.c_attn.weight",
"shape": [
4608,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 33030144,
"byteOffset": 0
}
],
"md5sum": "10c68f4a89d8c9e5ac3fd00b5ce2ee47"
},
{
"dataPath": "params_shard_16.bin",
"format": "raw-shard",
"nbytes": 25690112,
"records": [
{
"name": "model.layers.3.self_attn.o_proj.weight",
"shape": [
3584,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 25690112,
"byteOffset": 0
}
],
"md5sum": "e655468aacdcefbc5172993aea2634e2"
},
{
"dataPath": "params_shard_17.bin",
"format": "raw-shard",
"nbytes": 33131520,
"records": [
{
"name": "model.layers.3.input_layernorm.weight",
"shape": [
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 7168,
"byteOffset": 0
},
{
"name": "model.layers.3.post_attention_layernorm.weight",
"shape": [
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 7168,
"byteOffset": 7168
},
{
"name": "model.norm.weight",
"shape": [
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 7168,
"byteOffset": 14336
},
{
"name": "model.layers.0.input_layernorm.weight",
"shape": [
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 7168,
"byteOffset": 21504
},
{
"name": "model.layers.0.post_attention_layernorm.weight",
"shape": [
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 7168,
"byteOffset": 28672
},
{
"name": "model.layers.0.self_attn.c_attn.bias",
"shape": [
4608
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 9216,
"byteOffset": 35840
},
{
"name": "model.layers.0.self_attn.c_attn.weight",
"shape": [
4608,
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 33030144,
"byteOffset": 45056
},
{
"name": "model.layers.1.input_layernorm.weight",
"shape": [
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 7168,
"byteOffset": 33075200
},
{
"name": "model.layers.1.post_attention_layernorm.weight",
"shape": [
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 7168,
"byteOffset": 33082368
},
{
"name": "model.layers.1.self_attn.c_attn.bias",
"shape": [
4608
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 9216,
"byteOffset": 33089536
},
{
"name": "model.layers.2.input_layernorm.weight",
"shape": [
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 7168,
"byteOffset": 33098752
},
{
"name": "model.layers.2.post_attention_layernorm.weight",
"shape": [
3584
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 7168,
"byteOffset": 33105920
},
{
"name": "model.layers.2.self_attn.c_attn.bias",
"shape": [
4608
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 9216,
"byteOffset": 33113088
},
{
"name": "model.layers.3.self_attn.c_attn.bias",
"shape": [
4608
],
"dtype": "float16",
"format": "f32-to-bf16",
"nbytes": 9216,
"byteOffset": 33122304
}
],
"md5sum": "8024ca13796190a329892865444cd3d9"
}
]
}