wenhuach committed 19 days ago

Commit

cb38f4a

•

1 Parent(s): 7faf1e0

autoround format

Browse files

Signed-off-by: wenhuach <wenhuach87@gmail.com>

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +1 -0
config.json +58 -0
generation_config.json +12 -0
model-00001-of-00044.safetensors +3 -0
model-00002-of-00044.safetensors +3 -0
model-00003-of-00044.safetensors +3 -0
model-00004-of-00044.safetensors +3 -0
model-00005-of-00044.safetensors +3 -0
model-00006-of-00044.safetensors +3 -0
model-00007-of-00044.safetensors +3 -0
model-00008-of-00044.safetensors +3 -0
model-00009-of-00044.safetensors +3 -0
model-00010-of-00044.safetensors +3 -0
model-00011-of-00044.safetensors +3 -0
model-00012-of-00044.safetensors +3 -0
model-00013-of-00044.safetensors +3 -0
model-00014-of-00044.safetensors +3 -0
model-00015-of-00044.safetensors +3 -0
model-00016-of-00044.safetensors +3 -0
model-00017-of-00044.safetensors +3 -0
model-00018-of-00044.safetensors +3 -0
model-00019-of-00044.safetensors +3 -0
model-00020-of-00044.safetensors +3 -0
model-00021-of-00044.safetensors +3 -0
model-00022-of-00044.safetensors +3 -0
model-00023-of-00044.safetensors +3 -0
model-00024-of-00044.safetensors +3 -0
model-00025-of-00044.safetensors +3 -0
model-00026-of-00044.safetensors +3 -0
model-00027-of-00044.safetensors +3 -0
model-00028-of-00044.safetensors +3 -0
model-00029-of-00044.safetensors +3 -0
model-00030-of-00044.safetensors +3 -0
model-00031-of-00044.safetensors +3 -0
model-00032-of-00044.safetensors +3 -0
model-00033-of-00044.safetensors +3 -0
model-00034-of-00044.safetensors +3 -0
model-00035-of-00044.safetensors +3 -0
model-00036-of-00044.safetensors +3 -0
model-00037-of-00044.safetensors +3 -0
model-00038-of-00044.safetensors +3 -0
model-00039-of-00044.safetensors +3 -0
model-00040-of-00044.safetensors +3 -0
model-00041-of-00044.safetensors +3 -0
model-00042-of-00044.safetensors +3 -0
model-00043-of-00044.safetensors +3 -0
model-00044-of-00044.safetensors +3 -0
model.safetensors.index.json +0 -0
quantization_config.json +24 -0
special_tokens_map.json +16 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

config.json ADDED Viewed

	@@ -0,0 +1,58 @@

+{
+  "_name_or_path": "/data6/models/Meta-Llama-3.1-405B-Instruct",
+  "architectures": [
+    "LlamaForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 128000,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
+  "head_dim": 128,
+  "hidden_act": "silu",
+  "hidden_size": 16384,
+  "initializer_range": 0.02,
+  "intermediate_size": 53248,
+  "max_position_embeddings": 131072,
+  "mlp_bias": false,
+  "model_type": "llama",
+  "num_attention_heads": 128,
+  "num_hidden_layers": 126,
+  "num_key_value_heads": 16,
+  "pretraining_tp": 1,
+  "quantization_config": {
+    "amp": true,
+    "autoround_version": "0.4.3",
+    "backend": "auto_round:gptq:exllamav2",
+    "batch_size": 1,
+    "bits": 4,
+    "data_type": "int",
+    "dataset": "NeelNanda/pile-10k",
+    "enable_minmax_tuning": true,
+    "enable_norm_bias_tuning": false,
+    "enable_quanted_input": true,
+    "gradient_accumulate_steps": 4,
+    "group_size": -1,
+    "iters": 200,
+    "low_gpu_mem_usage": true,
+    "lr": 0.005,
+    "minmax_lr": 0.005,
+    "nsamples": 128,
+    "quant_method": "intel/auto-round",
+    "scale_dtype": "torch.float16",
+    "seqlen": 2048,
+    "sym": true,
+    "to_quant_block_names": null
+  },
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 500000.0,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.47.0",
+  "use_cache": true,
+  "vocab_size": 128256
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,12 @@

+{
+  "bos_token_id": 128000,
+  "do_sample": true,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
+  "temperature": 0.6,
+  "top_p": 0.9,
+  "transformers_version": "4.47.0"
+}

model-00001-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a0e012ec3f44deea4607dbebbbe67e1ae7c0c16050cd756518548e30f7d65428
+size 4941445440

model-00002-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b2f8259ff72a4e903925be56639246e4510ac4419cb11b6ff0cc25ad32b8746c
+size 4835061656

model-00003-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:149f5e7eaadabc17813947121b978471dc7bc7338ffddf34fabda3e1111e6b98
+size 4835061656

model-00004-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5167bf2c990e8f58a535eebd0c9c2ef2668e5115370f7757b71c18994de1e55d
+size 4835061656

model-00005-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d44db660ffa81ba4afbeab4ac5ca127499367b9a13d19878bbf58c9f18f4ee8
+size 4835061736

model-00006-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2c3855cf7aecdf9fae01a3632e9ee90a17434ac4de35f7227e6b4c5b78d03281
+size 4835061752

model-00007-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d57299a546ab60d40a468751a330663338593ed74a9f5465be698ff2695bb0bb
+size 4835061752

model-00008-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f47b6c03f6bcb2e59285a0a403b3504e88cccbe869d74c690f264869cf1a9d54
+size 4835061752

model-00009-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e477431cc9ef00190fa9ef2954197fb39068ea162aa3d160d695d65a9aa93dac
+size 4835061752

model-00010-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d9d1ddf3a47512dac382a0b3546950c2e5863ee228c8945cb5e2bee5d578f394
+size 4835061752

model-00011-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a0c2e19f2bfb9bfe837f2e8ee4d7819e202e2db3030a5d9feeec8b8cf0b15e48
+size 4835061752

model-00012-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6c11ec4493cf163310f26029858759d236d04b0f6378ec4eb7cbf6283821c8e8
+size 4835061752

model-00013-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a206bf08b0b9048548879e3046e07361e22ff992df307488a540d2df1f4f82f8
+size 4835061752

model-00014-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0252d569d041e4c5888f71b756c9c730f7c3fadfef597f51587aa1b9099d46f8
+size 4835061752

model-00015-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:debb9846b20a6cda398269af579dd3da5f293143507c804ed02d57a4d3c2e867
+size 4835061752

model-00016-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:356ffcfa18ac44c18f5557391279d869bc5986deca193f3e7f385ddbc0e40f48
+size 4835061752

model-00017-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:41e3b385c7345b5d820f28b6114ba9e212632ac7a785572ae6933515717f96cc
+size 4835061752

model-00018-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a80d005a53159a2fe5fcd1d65d0b1e3119cd0a50ef0392868019f5303fc92fb
+size 4835061752

model-00019-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5edd68e3305fa4d6c535efb69369093e42d4841ba61ff202f515791426fa57f0
+size 4835061752

model-00020-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49e1956c7d365141cedda43d5f62bffd60b6812c22fd4912746cafa9bce0d357
+size 4835061752

model-00021-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:27edf55ba8497284bb2684a267efa8adfdc10af2f2cdebd46bdb73f32727b6be
+size 4835061752

model-00022-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e52d195e2b475c3b632b66e3311ad056d0b6b58853d37df94f826e25ead431bd
+size 4835061752

model-00023-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:db951f808f3944001357bf8e5bf4aa6fcb022a9d1685966872b729d72e744b8d
+size 4835061752

model-00024-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ae76848da89b0300f8e649d1c49c9de351723c2692c80bc53715567e6165a92b
+size 4835061752

model-00025-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:09417331a6dacd03dc6273a5e62917659dd9c7b030e8f90d88354619cb4d6257
+size 4835061752

model-00026-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef43240ab186dd84029eb2e2c78843be4c0c9b4acb85ed875821e62d98d2630c
+size 4835061752

model-00027-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9dc748768c9df33ae5028f9cb9382bdc938c058b47a9001da5cd73309b4ac348
+size 4835061752

model-00028-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fd52c89e204eb68f397ecab0264591d3394e972c31b4a4b7b332a71b637b1713
+size 4835061752

model-00029-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d98a912a986079821863e330ba02b0230a2ca4ebd3594aedf5ada74685a8a339
+size 4835061752

model-00030-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e27bd3d17d644d72c8a93ae3a7f544f56b72b13b075d0ceb1283a439b13d8397
+size 4835061752

model-00031-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b7dd207b62db6f459c3142cacd4316078f7cfed927a5c1b5dd586598bde4e66c
+size 4835061752

model-00032-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:363f75e93850dd5bbf21085c46998d2de4be8fe7ea3e6df86be2bb01c60320a3
+size 4835061752

model-00033-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d0a6f8859542abce3a64b8490dcce0a74577f7e68a792dc9ee9d2d977a2e81ec
+size 4835061752

model-00034-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d051d247352a1176b33fdede0e1fb8d20863cd5bc6e6b3ca9b1c7d2f1e3f475d
+size 4835061752

model-00035-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d27196eb6805942f7fe28e98ed367e836e0bb9218923e7538ea4e09fb7fd31c1
+size 4835061832

model-00036-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:87f2fea2a9d710060eb986ea952f5feb1ce948b229236ca499687146df196032
+size 4835061840

model-00037-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5db7c3d7fa72c39de61c7c1aced4528eb7cafb5fbc32546e63ee7b8864f8d192
+size 4835061840

model-00038-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:88ad6d6599bc4299ca5a292c3863fc8a6cdc86ffe5d151fb914494ed685a9ae3
+size 4835061840

model-00039-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:79fba7636576365e5b266a55cd1c56b2d40c18f1fb98dc52abb52a1c136ca6a4
+size 4835061840

model-00040-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d570b4ccaf60a7f4d0cfbb999dae5f10fb47b6e35083804469a764bada4dee66
+size 4835061840

model-00041-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8660c30ebc4ce89e1d9f71fd5049ff8b9001d0efc9fc9ec0a7c5b51de1c244f
+size 4835061840

model-00042-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:475c7145b02f53c208e53add8e3defcdfd08d6283d71d498ef21a3a52c7d11b5
+size 4835061840

model-00043-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:051d02b61978157fb7820ce51a20b6918d56835a6cc856e72dfac5cf675dfc35
+size 4096341936

model-00044-of-00044.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:71b079a02069ebe5a5f4f8135815f136afb1d6fc4423620dcb2a14fa399cdf12
+size 4202692736

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

quantization_config.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "bits": 4,
+  "group_size": -1,
+  "sym": true,
+  "data_type": "int",
+  "enable_quanted_input": true,
+  "enable_minmax_tuning": true,
+  "seqlen": 2048,
+  "batch_size": 1,
+  "scale_dtype": "torch.float16",
+  "lr": 0.005,
+  "minmax_lr": 0.005,
+  "gradient_accumulate_steps": 4,
+  "iters": 200,
+  "amp": true,
+  "nsamples": 128,
+  "low_gpu_mem_usage": true,
+  "to_quant_block_names": null,
+  "enable_norm_bias_tuning": false,
+  "dataset": "NeelNanda/pile-10k",
+  "autoround_version": "0.4.3",
+  "quant_method": "intel/auto-round",
+  "backend": "auto_round:gptq:exllamav2"
+}

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "bos_token": {
+    "content": "<|begin_of_text|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<|eot_id|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}