voidful committed on
Commit
4afce60
·
verified ·
1 Parent(s): 6521122

Training in progress, step 200

Browse files
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad9cc7f4beddacbec9c8276122fd42a150b617af6356a01908319580f9077b51
3
  size 4988522632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fa2da824fe76b51a31adc346b27214db6db2f1bf53b97c2bbf11ad69a49a120
3
  size 4988522632
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53dec1875128efa82de06236dd55fe8736578a95d2178a096dd73ca1c0bb2884
3
- size 1856315036
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12b7875946fdd1ddd66c50db49968c586f2c781bf771cf10300dbb8211ef5bf5
3
+ size 2795955204
model.safetensors.index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "metadata": {
3
- "total_size": 16749197212
4
  },
5
  "weight_map": {
6
  "adapter.bias": "model-00004-of-00004.safetensors",
@@ -14,16 +14,30 @@
14
  "codec_decoding_heads.5.weight": "model-00004-of-00004.safetensors",
15
  "codec_decoding_heads.6.weight": "model-00004-of-00004.safetensors",
16
  "codec_decoding_heads.7.weight": "model-00004-of-00004.safetensors",
17
- "fuser.linear1.bias": "model-00004-of-00004.safetensors",
18
- "fuser.linear1.weight": "model-00004-of-00004.safetensors",
19
- "fuser.linear2.bias": "model-00004-of-00004.safetensors",
20
- "fuser.linear2.weight": "model-00004-of-00004.safetensors",
21
- "fuser.linear3.bias": "model-00004-of-00004.safetensors",
22
- "fuser.linear3.weight": "model-00004-of-00004.safetensors",
23
- "fuser.linear4.bias": "model-00004-of-00004.safetensors",
24
- "fuser.linear4.weight": "model-00004-of-00004.safetensors",
25
- "fuser.linear5.bias": "model-00004-of-00004.safetensors",
26
- "fuser.linear5.weight": "model-00004-of-00004.safetensors",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
27
  "layer_norm.bias": "model-00004-of-00004.safetensors",
28
  "layer_norm.weight": "model-00004-of-00004.safetensors",
29
  "learned_layer_weight": "model-00001-of-00004.safetensors",
 
1
  {
2
  "metadata": {
3
+ "total_size": 17688835996
4
  },
5
  "weight_map": {
6
  "adapter.bias": "model-00004-of-00004.safetensors",
 
14
  "codec_decoding_heads.5.weight": "model-00004-of-00004.safetensors",
15
  "codec_decoding_heads.6.weight": "model-00004-of-00004.safetensors",
16
  "codec_decoding_heads.7.weight": "model-00004-of-00004.safetensors",
17
+ "fuser.linears.0.bias": "model-00004-of-00004.safetensors",
18
+ "fuser.linears.0.weight": "model-00004-of-00004.safetensors",
19
+ "fuser.linears.1.bias": "model-00004-of-00004.safetensors",
20
+ "fuser.linears.1.weight": "model-00004-of-00004.safetensors",
21
+ "fuser.linears.10.bias": "model-00004-of-00004.safetensors",
22
+ "fuser.linears.10.weight": "model-00004-of-00004.safetensors",
23
+ "fuser.linears.11.bias": "model-00004-of-00004.safetensors",
24
+ "fuser.linears.11.weight": "model-00004-of-00004.safetensors",
25
+ "fuser.linears.2.bias": "model-00004-of-00004.safetensors",
26
+ "fuser.linears.2.weight": "model-00004-of-00004.safetensors",
27
+ "fuser.linears.3.bias": "model-00004-of-00004.safetensors",
28
+ "fuser.linears.3.weight": "model-00004-of-00004.safetensors",
29
+ "fuser.linears.4.bias": "model-00004-of-00004.safetensors",
30
+ "fuser.linears.4.weight": "model-00004-of-00004.safetensors",
31
+ "fuser.linears.5.bias": "model-00004-of-00004.safetensors",
32
+ "fuser.linears.5.weight": "model-00004-of-00004.safetensors",
33
+ "fuser.linears.6.bias": "model-00004-of-00004.safetensors",
34
+ "fuser.linears.6.weight": "model-00004-of-00004.safetensors",
35
+ "fuser.linears.7.bias": "model-00004-of-00004.safetensors",
36
+ "fuser.linears.7.weight": "model-00004-of-00004.safetensors",
37
+ "fuser.linears.8.bias": "model-00004-of-00004.safetensors",
38
+ "fuser.linears.8.weight": "model-00004-of-00004.safetensors",
39
+ "fuser.linears.9.bias": "model-00004-of-00004.safetensors",
40
+ "fuser.linears.9.weight": "model-00004-of-00004.safetensors",
41
  "layer_norm.bias": "model-00004-of-00004.safetensors",
42
  "layer_norm.weight": "model-00004-of-00004.safetensors",
43
  "learned_layer_weight": "model-00001-of-00004.safetensors",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59699c20e1a688f83b7fd22a794114528507d9486108d14371000973ff19a6af
3
  size 7672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:537a51edfc2b5fa49fb8ac77d7cef18fe1c1b5fec55ff4c127e7cbd280efbadf
3
  size 7672