zitongyang commited on
Commit
a355b93
·
verified ·
1 Parent(s): 98d070e

Upload LlamaForCausalLM

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "meta-llama/Llama-3.1-8B-Instruct",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
@@ -11,6 +11,7 @@
11
  128008,
12
  128009
13
  ],
 
14
  "hidden_act": "silu",
15
  "hidden_size": 4096,
16
  "initializer_range": 0.02,
@@ -33,7 +34,7 @@
33
  "rope_theta": 500000.0,
34
  "tie_word_embeddings": false,
35
  "torch_dtype": "float32",
36
- "transformers_version": "4.43.3",
37
  "use_cache": true,
38
  "vocab_size": 128256
39
  }
 
1
  {
2
+ "_name_or_path": "ckpts/llama_dagger_20241027_010023_iter2",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
11
  128008,
12
  128009
13
  ],
14
+ "head_dim": 128,
15
  "hidden_act": "silu",
16
  "hidden_size": 4096,
17
  "initializer_range": 0.02,
 
34
  "rope_theta": 500000.0,
35
  "tie_word_embeddings": false,
36
  "torch_dtype": "float32",
37
+ "transformers_version": "4.46.0",
38
  "use_cache": true,
39
  "vocab_size": 128256
40
  }
generation_config.json CHANGED
@@ -8,5 +8,5 @@
8
  ],
9
  "temperature": 0.6,
10
  "top_p": 0.9,
11
- "transformers_version": "4.43.3"
12
  }
 
8
  ],
9
  "temperature": 0.6,
10
  "top_p": 0.9,
11
+ "transformers_version": "4.46.0"
12
  }
model-00001-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:acbd2f6e74010a338fb710f540819eeae08825e732e4fc4785d81184a831a283
3
  size 4886466168
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b42565d7de980801baa25e20ceb3ec9191c2e02a1554eb79b95180b6246ce93f
3
  size 4886466168
model-00002-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cfdc131cc66c93d4bc3c30ac4f67dd87522ecd56e62f50408af908d501345e3f
3
  size 4832007448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eacdf82e18505450e5fca99f6c420efd927d13942560711727f91607f6a0c3f
3
  size 4832007448
model-00003-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21782fb7c967945cafcc8ed75765c7437f56a57a3ec215eebb8bddccfbe63599
3
  size 4999813112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:467de4f84140758b5c98c161201c482ecb1c38ef4925f614f6f952b37444db83
3
  size 4999813112
model-00004-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c815ade9699a516f44ac0ca2787d11115fbd5694b93531861ea71d1ed1989c68
3
  size 4999813128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aecb0d25dcc2e55f65b1fe68d8e7c1a2525c2b4e01995188ab895d0914c744c8
3
  size 4999813128
model-00005-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0290410d9023913ab3da810357fea671de27b00df03d0fb97dcca75b9bddbae3
3
  size 4832007496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3734eea80f072dac96138f45eed2fbc381678495a87808e0c037e9681b674672
3
  size 4832007496
model-00006-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfc9f3ab3395551b508d3302abc5bbdcc06657c67f953bac73e66c17892b8eed
3
  size 4999813120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d6a99a51d3dcb371684f006a99808c73bd0bb74974ec38e00604fe26816fcfa
3
  size 4999813120
model-00007-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b75e30d72d9baedbeccb47b41715179a6d6aebdd375762045a3e1b9405e1f59
3
  size 2571158184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f4227733885b5c3e32e653456d463912f48847b14a953b8a49ab4670e3fa460
3
  size 2571158184