ricklamers
committed on
Commit
•
80ef0bf
1
Parent(s):
ebbcf0b
feat: update to better 70b dpo tune
Browse files
- config.json +3 -3
- generation_config.json +2 -2
- model-00001-of-00030.safetensors +2 -2
- model-00002-of-00030.safetensors +2 -2
- model-00003-of-00030.safetensors +2 -2
- model-00004-of-00030.safetensors +2 -2
- model-00005-of-00030.safetensors +2 -2
- model-00006-of-00030.safetensors +2 -2
- model-00007-of-00030.safetensors +2 -2
- model-00008-of-00030.safetensors +2 -2
- model-00009-of-00030.safetensors +2 -2
- model-00010-of-00030.safetensors +2 -2
- model-00011-of-00030.safetensors +2 -2
- model-00012-of-00030.safetensors +2 -2
- model-00013-of-00030.safetensors +2 -2
- model-00014-of-00030.safetensors +2 -2
- model-00015-of-00030.safetensors +2 -2
- model-00016-of-00030.safetensors +2 -2
- model-00017-of-00030.safetensors +2 -2
- model-00018-of-00030.safetensors +2 -2
- model-00019-of-00030.safetensors +2 -2
- model-00020-of-00030.safetensors +2 -2
- model-00021-of-00030.safetensors +2 -2
- model-00022-of-00030.safetensors +2 -2
- model-00023-of-00030.safetensors +2 -2
- model-00024-of-00030.safetensors +2 -2
- model-00025-of-00030.safetensors +2 -2
- model-00026-of-00030.safetensors +2 -2
- model-00027-of-00030.safetensors +2 -2
- model-00028-of-00030.safetensors +2 -2
- model-00029-of-00030.safetensors +2 -2
- model-00030-of-00030.safetensors +2 -2
- special_tokens_map.json +43 -13
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
@@ -22,8 +22,8 @@
|
|
22 |
"rope_scaling": null,
|
23 |
"rope_theta": 500000.0,
|
24 |
"tie_word_embeddings": false,
|
25 |
-
"torch_dtype": "
|
26 |
"transformers_version": "4.41.2",
|
27 |
-
"use_cache":
|
28 |
"vocab_size": 128262
|
29 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "meta-llama/Meta-Llama-3-70B-Instruct",
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
|
|
22 |
"rope_scaling": null,
|
23 |
"rope_theta": 500000.0,
|
24 |
"tie_word_embeddings": false,
|
25 |
+
"torch_dtype": "bfloat16",
|
26 |
"transformers_version": "4.41.2",
|
27 |
+
"use_cache": false,
|
28 |
"vocab_size": 128262
|
29 |
}
|
generation_config.json
CHANGED
@@ -6,7 +6,7 @@
|
|
6 |
128009
|
7 |
],
|
8 |
"max_length": 4096,
|
9 |
-
"temperature": 0.
|
10 |
-
"top_p": 0.
|
11 |
"transformers_version": "4.41.2"
|
12 |
}
|
|
|
6 |
128009
|
7 |
],
|
8 |
"max_length": 4096,
|
9 |
+
"temperature": 0.6,
|
10 |
+
"top_p": 0.9,
|
11 |
"transformers_version": "4.41.2"
|
12 |
}
|
model-00001-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89c0cf12c018c38cf7c8b391c163150bf9b7ed0cc6d9ef39dea1a8cb05ccc6c3
|
3 |
+
size 1667887104
|
model-00002-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b773c80ad2a40b3874b5e7e27bae3435a0c7b46b548960f21474641392fd1f01
|
3 |
+
size 2271522816
|
model-00003-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8f2dfa59ce691f77e9f9c61fd5c430f6a6fd05f0e8c7af261dcab451347b9dc
|
3 |
+
size 2902474752
|
model-00004-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:684654854a05cf480fd6078dad5fdc30dc3150abdd0e473a1e8a77ee4a8f7e09
|
3 |
+
size 1926475776
|
model-00005-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d24b87bb35ccfa24148e645511011a0a606b7104f63cffaa18ce62ddb2027acd
|
3 |
+
size 2115403776
|
model-00006-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e4d22a5c2587e7201e580e30b33983672512c61cf360c9c52f167831ed5fca3
|
3 |
+
size 2085535744
|
model-00007-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a16256256708582ebb192d49321a2fb587f7e26b4cf34b3aef7b320871ecf49
|
3 |
+
size 3320299520
|
model-00008-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3893f5ee9b0aeed6f38412cdff44d1f9a9acc972188d889c46961ae6743303dc
|
3 |
+
size 2075869184
|
model-00009-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac3300128ce519ca18bec75cc818270a33f02b21dff51bc139862896fdd49cc7
|
3 |
+
size 2178609152
|
model-00010-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86db844cd3f365fd1f45fb907beff98f0081813f71d8356a820684a88731437c
|
3 |
+
size 2317238272
|
model-00011-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54caa3ed702ad418e81d669b4d4b6e5e09eb2c8f18d22264b2b59a75edb93929
|
3 |
+
size 2744877056
|
model-00012-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9d7e17c168fa1255949fbfe076a48e9f2275946afef00db8a4deab2c9029932
|
3 |
+
size 1326813184
|
model-00013-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09397e734de2662b3769f2aed6775f3a3dc4d970a8c3bdad41319e828f41ee3a
|
3 |
+
size 1561567232
|
model-00014-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9326ddb10d7590df13bac3090d7bf48bf86ff32d64f1e462dd1e19491a0b63fa
|
3 |
+
size 1665040384
|
model-00015-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ae0863d919bcaaacdbe4d96226aaf2a15c3bec7a145a9baaa18f0a172d06a1a
|
3 |
+
size 2390306816
|
model-00016-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6697f8a014e85835d44b83b402dd91b6712b203d1a2cb7708083d9e533550115
|
3 |
+
size 2289614848
|
model-00017-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2558e7fc3dc3fdfde2892167f1ccb2c14847f7321f3814d0db5b41c88fe2ec6
|
3 |
+
size 2891030528
|
model-00018-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dee78cab4bd9e87394346a01e1bea9327dc7b5f3755a85dc49fe89cef48b2ea3
|
3 |
+
size 2341629952
|
model-00019-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92a1d92ae627b31b4ab238023bda6eb2a250a6fcc9ad1638d45e5ce100ed9712
|
3 |
+
size 2105212928
|
model-00020-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b896da817bee7d9ed78115ddc8e040390ee0530829fef1ede2e76d34a28606a
|
3 |
+
size 2810728448
|
model-00021-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a2c8b57bc56b79abb1912fa03e49c89ecf8fb7e915bf42f7b15824d37ec7a54
|
3 |
+
size 3029651456
|
model-00022-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74f4cc5b8bfcf45af3e350e1e017995d4b537d06fb9f746074e5c34027243678
|
3 |
+
size 2894012416
|
model-00023-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b06e19f02ab4cbf03c5c5c76ab2881b2c54cd10cd18b84f14d9ef94c9db6286
|
3 |
+
size 3130228736
|
model-00024-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cfb5fc51d3d63ccd00156687760a316c39bb658eb522aad546f8538f7ce8354
|
3 |
+
size 2198028288
|
model-00025-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c15a0be5c7422bdbb8cb6821223c9784986149a688222df17a7517e6b7a653b7
|
3 |
+
size 1973522432
|
model-00026-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75edb61f8380b8538c97e2836193ac0ebc69709581e3e07eb7de7ae20e583ab8
|
3 |
+
size 2898800640
|
model-00027-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dce82bb4cd6b6d85a4777610c56bd2e4e641f9184d837586b4150314cfff5d55
|
3 |
+
size 3183329280
|
model-00028-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:092b657556324213f842104f7a6323c96f19240be6fd59bcad858b388599c3bc
|
3 |
+
size 2281537536
|
model-00029-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0ac27bb6c9fcd4e6aaf102900ec9febe1ef499bc39eeab9306395e5d3207a53
|
3 |
+
size 1924145152
|
model-00030-of-00030.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61042debc22650145088384224e4ea399eb746ac8a92b63af5f334b573a85c40
|
3 |
+
size 1739042816
|
special_tokens_map.json
CHANGED
@@ -1,11 +1,47 @@
|
|
1 |
{
|
2 |
"additional_special_tokens": [
|
3 |
-
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
9 |
],
|
10 |
"bos_token": {
|
11 |
"content": "<|begin_of_text|>",
|
@@ -21,11 +57,5 @@
|
|
21 |
"rstrip": false,
|
22 |
"single_word": false
|
23 |
},
|
24 |
-
"pad_token":
|
25 |
-
"content": "<|eot_id|>",
|
26 |
-
"lstrip": false,
|
27 |
-
"normalized": false,
|
28 |
-
"rstrip": false,
|
29 |
-
"single_word": false
|
30 |
-
}
|
31 |
}
|
|
|
1 |
{
|
2 |
"additional_special_tokens": [
|
3 |
+
{
|
4 |
+
"content": "<tool_call>",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false
|
9 |
+
},
|
10 |
+
{
|
11 |
+
"content": "</tool_call>",
|
12 |
+
"lstrip": false,
|
13 |
+
"normalized": false,
|
14 |
+
"rstrip": false,
|
15 |
+
"single_word": false
|
16 |
+
},
|
17 |
+
{
|
18 |
+
"content": "<tools>",
|
19 |
+
"lstrip": false,
|
20 |
+
"normalized": false,
|
21 |
+
"rstrip": false,
|
22 |
+
"single_word": false
|
23 |
+
},
|
24 |
+
{
|
25 |
+
"content": "</tools>",
|
26 |
+
"lstrip": false,
|
27 |
+
"normalized": false,
|
28 |
+
"rstrip": false,
|
29 |
+
"single_word": false
|
30 |
+
},
|
31 |
+
{
|
32 |
+
"content": "<tool_response>",
|
33 |
+
"lstrip": false,
|
34 |
+
"normalized": false,
|
35 |
+
"rstrip": false,
|
36 |
+
"single_word": false
|
37 |
+
},
|
38 |
+
{
|
39 |
+
"content": "</tool_response>",
|
40 |
+
"lstrip": false,
|
41 |
+
"normalized": false,
|
42 |
+
"rstrip": false,
|
43 |
+
"single_word": false
|
44 |
+
}
|
45 |
],
|
46 |
"bos_token": {
|
47 |
"content": "<|begin_of_text|>",
|
|
|
57 |
"rstrip": false,
|
58 |
"single_word": false
|
59 |
},
|
60 |
+
"pad_token": "<|eot_id|>"
|
|
|
|
|
|
|
|
|
|
|
|
|
61 |
}
|