add model
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +35 -0
- generation_config.json +9 -0
- model-00001-of-00062.safetensors +3 -0
- model-00002-of-00062.safetensors +3 -0
- model-00003-of-00062.safetensors +3 -0
- model-00004-of-00062.safetensors +3 -0
- model-00005-of-00062.safetensors +3 -0
- model-00006-of-00062.safetensors +3 -0
- model-00007-of-00062.safetensors +3 -0
- model-00008-of-00062.safetensors +3 -0
- model-00009-of-00062.safetensors +3 -0
- model-00010-of-00062.safetensors +3 -0
- model-00011-of-00062.safetensors +3 -0
- model-00012-of-00062.safetensors +3 -0
- model-00013-of-00062.safetensors +3 -0
- model-00014-of-00062.safetensors +3 -0
- model-00015-of-00062.safetensors +3 -0
- model-00016-of-00062.safetensors +3 -0
- model-00017-of-00062.safetensors +3 -0
- model-00018-of-00062.safetensors +3 -0
- model-00019-of-00062.safetensors +3 -0
- model-00020-of-00062.safetensors +3 -0
- model-00021-of-00062.safetensors +3 -0
- model-00022-of-00062.safetensors +3 -0
- model-00023-of-00062.safetensors +3 -0
- model-00024-of-00062.safetensors +3 -0
- model-00025-of-00062.safetensors +3 -0
- model-00026-of-00062.safetensors +3 -0
- model-00027-of-00062.safetensors +3 -0
- model-00028-of-00062.safetensors +3 -0
- model-00029-of-00062.safetensors +3 -0
- model-00030-of-00062.safetensors +3 -0
- model-00031-of-00062.safetensors +3 -0
- model-00032-of-00062.safetensors +3 -0
- model-00033-of-00062.safetensors +3 -0
- model-00034-of-00062.safetensors +3 -0
- model-00035-of-00062.safetensors +3 -0
- model-00036-of-00062.safetensors +3 -0
- model-00037-of-00062.safetensors +3 -0
- model-00038-of-00062.safetensors +3 -0
- model-00039-of-00062.safetensors +3 -0
- model-00040-of-00062.safetensors +3 -0
- model-00041-of-00062.safetensors +3 -0
- model-00042-of-00062.safetensors +3 -0
- model-00043-of-00062.safetensors +3 -0
- model-00044-of-00062.safetensors +3 -0
- model-00045-of-00062.safetensors +3 -0
- model-00046-of-00062.safetensors +3 -0
- model-00047-of-00062.safetensors +3 -0
- model-00048-of-00062.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/rl/web_policy/llama3-70b/web_policy_sft_lite_2/checkpoint-296",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": 128001,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 131072,
|
15 |
+
"mlp_bias": false,
|
16 |
+
"model_type": "llama",
|
17 |
+
"num_attention_heads": 64,
|
18 |
+
"num_hidden_layers": 80,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-05,
|
22 |
+
"rope_scaling": {
|
23 |
+
"factor": 8.0,
|
24 |
+
"high_freq_factor": 4.0,
|
25 |
+
"low_freq_factor": 1.0,
|
26 |
+
"original_max_position_embeddings": 8192,
|
27 |
+
"rope_type": "llama3"
|
28 |
+
},
|
29 |
+
"rope_theta": 500000.0,
|
30 |
+
"tie_word_embeddings": false,
|
31 |
+
"torch_dtype": "float32",
|
32 |
+
"transformers_version": "4.43.2",
|
33 |
+
"use_cache": false,
|
34 |
+
"vocab_size": 128256
|
35 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 128000,
|
4 |
+
"do_sample": true,
|
5 |
+
"eos_token_id": 128001,
|
6 |
+
"temperature": 0.6,
|
7 |
+
"top_p": 0.9,
|
8 |
+
"transformers_version": "4.43.2"
|
9 |
+
}
|
model-00001-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3404d2ba990f54a95c0221ed5414e9cb2570e45ddc77f8e9565dea0aea961719
|
3 |
+
size 4806672984
|
model-00002-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72199a8aceef2e835b9b5987daab8a841745bfcc331bd9174de5d64d26946de0
|
3 |
+
size 4362142864
|
model-00003-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20a23011a958ea0e7480060615e3ea6c15f35375bb86df8eba73078585627dad
|
3 |
+
size 4362142864
|
model-00004-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7219a0d3fe8cdff0309d057b9b6d13a4d01dbacc3dc10ed71f4dc74270663ff8
|
3 |
+
size 4966188864
|
model-00005-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e89a3473c64fdf1a3bfd069b3628b90af51ccea055cf14c484ba195d45e5135
|
3 |
+
size 4362142864
|
model-00006-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:012e96f4b2816c90eaf587d29fef68d70d5a84131489a58f047ba65f364e11bc
|
3 |
+
size 4362142864
|
model-00007-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be24fd7a37045c5ff8bb8d7c36f197c88c06f5cb1b0dadb7f8bd21658ea6a49b
|
3 |
+
size 4966188864
|
model-00008-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b3bc35523b1de13cdb1ec4eef0593bacee687c41f9b82521a2f249d37205c97
|
3 |
+
size 4362142864
|
model-00009-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8b35d1ff363dd0b2977043111cc3fad425677f6c9de46b48b3c0cfaddeb7961
|
3 |
+
size 4362142880
|
model-00010-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46ae4e44fb2fc197964a252d44b68680503d63980de1e6a8e9a3a6d6afb073dc
|
3 |
+
size 4966188880
|
model-00011-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9714f7c49ab876edcea363ab270521a455458c0cab7a32364736f899a1fbd0fb
|
3 |
+
size 4362142872
|
model-00012-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c88a8fee892208e6eff32c1fa75dc3e369a44d2990a6fc2646fd41bf992bf6e0
|
3 |
+
size 4362142872
|
model-00013-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:978e04f2c165c7a4c404458e12238461b038a67981ee1c8088dc6c52c5cb357c
|
3 |
+
size 4966188880
|
model-00014-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e6975d11fdfb81579e33c9349800e67d44e8054b3c1e68217cd81b3d0e1a3d9
|
3 |
+
size 4362142872
|
model-00015-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:405618f22edc77235903222903caa55c296fdc7e479feeb8d940d5de90d4c754
|
3 |
+
size 4362142872
|
model-00016-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9456c12b6533799e9c7e3db07d63a15ca86bb00def863653fa253320c6cdd732
|
3 |
+
size 4966188880
|
model-00017-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ebe1c6cdd65a6aa6ad9923961489e9f8bcfa8f012b21bcdaa0beb3e1ac56804
|
3 |
+
size 4362142872
|
model-00018-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a1846460db0a3f99f36335d2db7dececec759d9fa6d59a9a231d42a24890e36
|
3 |
+
size 4362142872
|
model-00019-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e1ebb2f52db274445274003f9ea683f0ea794fbb9d31bc5e2efbe1ba0283860
|
3 |
+
size 4966188880
|
model-00020-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5f35bd967c6cbed4e01815d3895060fd2418bb5a7460bd3d9edaf96d597be55
|
3 |
+
size 4362142872
|
model-00021-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c88981044dda235a940afd8299e572ed0a6e5aa785c65a9f29821be75292af2
|
3 |
+
size 4362142872
|
model-00022-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b38004ba62b1704d032055dcd1abdb02c8160c15a11b61dcdbbbc0355111f99
|
3 |
+
size 4966188880
|
model-00023-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e77aa0bfb01b67761adcb7cca4f3a9a41b8d749ae081acb82ad802c631438d6
|
3 |
+
size 4362142872
|
model-00024-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:712492ca1a5d4aefa7975e795848d423de9ad5cbd35bd258251640b7a5c52c1b
|
3 |
+
size 4362142872
|
model-00025-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1327f1ba2277184bed0fd21aa5ff496229db4afcb57fed31c00e2d5f7f7c2805
|
3 |
+
size 4966188880
|
model-00026-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03d2ba7cb253291fc3321e31e07ccccd687e361245df9f7c508ed2f3bbbc2345
|
3 |
+
size 4362142872
|
model-00027-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e8d67c44415cc17f2b5f4f3eb4a7bd8f55e49709eaa83312a0bb0ac01521667
|
3 |
+
size 4362142872
|
model-00028-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a66ae624746da7f974b73d511762c1dc9e9a62626dc9e8b2a15dae16d7879a3e
|
3 |
+
size 4966188880
|
model-00029-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4785fa27e309cfbd4de262b633fe0284dc774cc88608c56c02877a6a68ae9b75
|
3 |
+
size 4362142872
|
model-00030-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55b93c5f30204c5960bb707cbe6ea36c205243ed74a5a9487524ebded6fda0dc
|
3 |
+
size 4362142872
|
model-00031-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9105fd593721440b61f7a619abb714f95d972eafa9cd2155c4ff315b7a245a22
|
3 |
+
size 4966188880
|
model-00032-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb2747e11267cf8982c6068c4bff5963c9a7339569de70d66aa321d329e094e5
|
3 |
+
size 4362142872
|
model-00033-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a10dfb96cb1bf30d5946379929b4c8dbbac2e78e8388c8126302c5cc6119290
|
3 |
+
size 4362142872
|
model-00034-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49eed91ff3b487d7b305c9c5776bd455759d2d66950d80ce14732f36c932f5d4
|
3 |
+
size 4966188880
|
model-00035-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5300e471b9b7f3e1263778a81165ac2698854f86091af09d98d784ca8d22e22
|
3 |
+
size 4362142872
|
model-00036-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f85cf7791eef492c325cb7414fcfbac92dfb8c78142d73fc2c1aaddb3e8e1d91
|
3 |
+
size 4362142872
|
model-00037-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ab8f3a9dcba75892cc464c26101c88cc583549510f8a94fbf32db376989eb9f
|
3 |
+
size 4966188880
|
model-00038-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ffae158c4669f78e8693b13886a8c9136b5aebc5a07ad863797b799b1387ef7
|
3 |
+
size 4362142872
|
model-00039-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de83619f45f7665ae210daa1d4c7a60f028c8abdc11a4ec5fbc3c1586e960028
|
3 |
+
size 4362142872
|
model-00040-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c619a21dfb1fe420ef3dec587d6a4d74659fce63ba2018a3fcf755e99e0d35b3
|
3 |
+
size 4966188880
|
model-00041-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e294ecb1d3f0f64257f95e7e2ca0bd31aa0c5d83f6889055ab60e6413a10a1b
|
3 |
+
size 4362142872
|
model-00042-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74689f419487b8ec2b6e31bf8cc666a6d77644ac60fc1ab66d29b4e36f034b78
|
3 |
+
size 4362142872
|
model-00043-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f303589fa6bf348d4eb5636576156d80465e16f32c16942b216a2b50a52de478
|
3 |
+
size 4966188880
|
model-00044-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7edf26860eef18dcfeea97ddc672b9be571bfdb737cdf951400bd26b381c046
|
3 |
+
size 4362142872
|
model-00045-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35712376847838c581daf63240887f7b0d22ca57953024417ccd524861ec1703
|
3 |
+
size 4362142872
|
model-00046-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89101c6561b05f574139efefa2c039ee8cca34030e6de04edcd298634e412036
|
3 |
+
size 4966188880
|
model-00047-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8627808fd60fe4a851e05fcd80a6c9939dd057572480e98bccabc549b0c5abf6
|
3 |
+
size 4362142872
|
model-00048-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fdbff1ee77059beefaf11741b0ad03ef8fb495e7d33864797af262876adb276
|
3 |
+
size 4362142872
|