Saving weights and logs of step 10000
Browse files
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 497764120
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7f89852d3a6a38756fae270a2926fabccc5ded47ed03b2bdf72323d30b48553
|
3 |
size 497764120
|
runs/events.out.tfevents.1642099734.t1v-n-42145f73-w-0.2317757.0.v2
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbbf5988858cf76da919fb1758c11b0ecc821048cb24a60adc8a53b7f332f86b
|
3 |
+
size 15255487
|
runs/events.out.tfevents.1642208918.t1v-n-42145f73-w-0.2567321.0.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f34abfda811639f3d9abfb3c2ce67f5fda43568d82efbc314a084ecb090ebf6
|
3 |
+
size 1471449
|
start_train.sh
CHANGED
@@ -12,7 +12,7 @@ python3 run_clm_flax.py \
|
|
12 |
--block_size="512" \
|
13 |
--per_device_train_batch_size="32" \
|
14 |
--per_device_eval_batch_size="32" \
|
15 |
-
--preprocessing_num_workers="
|
16 |
--learning_rate="5e-3" \
|
17 |
--warmup_ratio="0.01" \
|
18 |
--cosine_decay \
|
|
|
12 |
--block_size="512" \
|
13 |
--per_device_train_batch_size="32" \
|
14 |
--per_device_eval_batch_size="32" \
|
15 |
+
--preprocessing_num_workers="1" \
|
16 |
--learning_rate="5e-3" \
|
17 |
--warmup_ratio="0.01" \
|
18 |
--cosine_decay \
|