cwaud committed on
Commit
75f730c
1 Parent(s): ba2f951

Training in progress, step 5

Browse files
adapter_config.json CHANGED
@@ -20,11 +20,11 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "o_proj",
24
  "up_proj",
25
- "k_proj",
26
  "gate_proj",
 
27
  "down_proj",
 
28
  "q_proj",
29
  "v_proj"
30
  ],
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "up_proj",
 
24
  "gate_proj",
25
+ "o_proj",
26
  "down_proj",
27
+ "k_proj",
28
  "q_proj",
29
  "v_proj"
30
  ],
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9851f2ce2335fa9ceff2d08c7791e820790ceffb6985e73379c7f3b6164d098
3
- size 1095799992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eaf666384dd4097633b64380f5256d90c768219ac3ef92ed6198968879cc234
3
+ size 45118424
config.json CHANGED
@@ -47,5 +47,5 @@
47
  "torch_dtype": "bfloat16",
48
  "transformers_version": "4.45.1",
49
  "use_cache": false,
50
- "vocab_size": 128257
51
  }
 
47
  "torch_dtype": "bfloat16",
48
  "transformers_version": "4.45.1",
49
  "use_cache": false,
50
+ "vocab_size": 128256
51
  }
special_tokens_map.json CHANGED
@@ -14,7 +14,7 @@
14
  "single_word": false
15
  },
16
  "pad_token": {
17
- "content": " ",
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
 
14
  "single_word": false
15
  },
16
  "pad_token": {
17
+ "content": "<|finetune_right_pad_id|>",
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22e9418ab95984e7ef5a01738e939415416ecded62e900139d3054935604f200
3
- size 17210098
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b
3
+ size 17209920
tokenizer_config.json CHANGED
@@ -2047,14 +2047,6 @@
2047
  "rstrip": false,
2048
  "single_word": false,
2049
  "special": true
2050
- },
2051
- "128256": {
2052
- "content": " ",
2053
- "lstrip": false,
2054
- "normalized": false,
2055
- "rstrip": false,
2056
- "single_word": false,
2057
- "special": true
2058
  }
2059
  },
2060
  "bos_token": "<|begin_of_text|>",
@@ -2066,7 +2058,7 @@
2066
  "attention_mask"
2067
  ],
2068
  "model_max_length": 131072,
2069
- "pad_token": " ",
2070
  "padding_side": "left",
2071
  "tokenizer_class": "PreTrainedTokenizerFast"
2072
  }
 
2047
  "rstrip": false,
2048
  "single_word": false,
2049
  "special": true
 
 
 
 
 
 
 
 
2050
  }
2051
  },
2052
  "bos_token": "<|begin_of_text|>",
 
2058
  "attention_mask"
2059
  ],
2060
  "model_max_length": 131072,
2061
+ "pad_token": "<|finetune_right_pad_id|>",
2062
  "padding_side": "left",
2063
  "tokenizer_class": "PreTrainedTokenizerFast"
2064
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26b16adc3474dc959339f40a125db5e9e705f95a61ba36f94f606cb65722e3a6
3
  size 6648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8bb872fc4af979d4644be3a4e7cd832ace947512f06305456d5f8aadcc96d23
3
  size 6648