aapot
commited on
Commit
•
5732ee1
1
Parent(s):
671e7e3
Add 50k train step and HF flax model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_50000/checkpoint +3 -0
- checkpoint_50000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_50000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_50000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_50000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f724cd14d5474599b95a87f6a7a36bd944ea2b55e066da452824fc848273bc1
|
3 |
+
size 6520637
|
checkpoint_50000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3e96692323fd24a9c65b1a06b85b0093e43e02e85b20106a3e56a1f5bcc5fe7
|
3 |
+
size 2737
|
checkpoint_50000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a41f468fe3e35b918b5355761b2810fb7f531bcd36189086689f895df06f18c2
|
3 |
+
size 2751
|
checkpoint_50000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5b1d18e35769f2ce49ec94171a3bec60a0bf4d776d47ed48c5934c7139c052c
|
3 |
+
size 2806
|
checkpoint_50000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:094ef214d33d90eeb9f18cdf784fa16bcabe9028cd0b9b062739dba5f4470cf4
|
3 |
+
size 2831
|
checkpoint_50000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2912d931a5dfd82ee5a74605371a3bb8f66abe6c773442513209a6b14e08b4ce
|
3 |
+
size 2812
|
checkpoint_50000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a70f5906c5b7699b2250ff376f88bda30a015d2f0eb1ba759d1a2213abd11e7e
|
3 |
+
size 2728
|
checkpoint_50000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5145f51d35b1e4d144d34f8502f5c0ab5f64c1a3ddd8d1af4843518aa9257ffb
|
3 |
+
size 2860
|
checkpoint_50000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bad2fcfc70d772166d2e5b0450f624a135b397543b0ec3fb662325f70f62b8f6
|
3 |
+
size 2794
|
checkpoint_50000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d174ac83f49427c94a181334372c9b9cf204d772893ef909c0a36e8df670b66d
|
3 |
+
size 2779
|
checkpoint_50000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa6fabfbc55b6d9668b5675139006356ca5cc5df467e058ba8030c37fa365914
|
3 |
+
size 2814
|
checkpoint_50000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd6046bbf1ec82b67270cc6c4aeb8ee0750f26095c9a35a39c3f276cd9da4ff9
|
3 |
+
size 2789
|
checkpoint_50000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:820bf2163a79d635c480bbf2579543614f81a53c7b884458d75e8b7b45e7505f
|
3 |
+
size 2763
|
checkpoint_50000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f9f8844c18a85f412b07b6e70b5bccb6146f48ca7968d0c2b44fac349b8fba0
|
3 |
+
size 2814
|
checkpoint_50000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61e605f210cd71e14019bb654146dd10a2eaee28e0132894015b79bde9f24b77
|
3 |
+
size 2768
|
checkpoint_50000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68cdf5fcb72f26f4cd1f1bf4ae7a9167382ed9260c717e9c8d9558fd6fdd6cfa
|
3 |
+
size 2750
|
checkpoint_50000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c4b54cae1c024442a469ed1efc4ce38e6d4a66fe832f7b345cbd5912c59ede5
|
3 |
+
size 2807
|
checkpoint_50000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe1cb798be7e758c5065abcdf48ba2a601691d23e5c9d61f4ecbd74c57031acc
|
3 |
+
size 2795
|
checkpoint_50000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3453d5461e148be90d1e306fa487ce8102a57b121cf03bbbd7089f31ed72c08
|
3 |
+
size 2776
|
checkpoint_50000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa84df3c83befa5d689e5c3cbf86ca805000abdfa5a113ec598714b897ed43cb
|
3 |
+
size 2803
|
checkpoint_50000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca89f798caa0b7efcdde896e8ccdccb9020841bc73dec53c72a33af7d9f30f86
|
3 |
+
size 2786
|
checkpoint_50000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28867adfdcb5746eda8102af99bb781306e92d6ac363364fd42434dbdcf12ced
|
3 |
+
size 2735
|
checkpoint_50000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d1c6e8b23a91822dc3b9647ffa3a2f0997caf12c637223510c7b1b774c12d07
|
3 |
+
size 2815
|
checkpoint_50000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32dcef8c677195c9063ad527281a05ff6bb359e9693b8cf258ed608ddc14af50
|
3 |
+
size 2782
|
checkpoint_50000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_50000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd47458246ae5be72cc6138c6782673a3d068cacc3583b4ccae1b04c688d61f4
|
3 |
+
size 2713
|
checkpoint_50000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|