Auto Commit
Browse files- 26.pt +3 -0
- 26_cfg.json +1 -0
- 27.pt +3 -0
- 27_cfg.json +1 -0
- 28.pt +3 -0
- 28_cfg.json +1 -0
- 29.pt +3 -0
- 29_cfg.json +1 -0
- 30.pt +3 -0
- 30_cfg.json +1 -0
- 31.pt +3 -0
- 31_cfg.json +1 -0
- 32.pt +3 -0
- 32_cfg.json +1 -0
- 33.pt +3 -0
- 33_cfg.json +1 -0
- 34.pt +3 -0
- 34_cfg.json +1 -0
- 35.pt +3 -0
- 35_cfg.json +1 -0
- 36.pt +3 -0
- 36_cfg.json +1 -0
- 37.pt +3 -0
- 37_cfg.json +1 -0
- 38.pt +3 -0
- 38_cfg.json +1 -0
- 39.pt +3 -0
- 39_cfg.json +1 -0
- 40.pt +3 -0
- 40_cfg.json +1 -0
- 41.pt +3 -0
- 41_cfg.json +1 -0
- 42.pt +3 -0
- 42_cfg.json +1 -0
- 43.pt +3 -0
- 43_cfg.json +1 -0
- 44.pt +3 -0
- 44_cfg.json +1 -0
- 45.pt +3 -0
- 45_cfg.json +1 -0
- 46.pt +3 -0
- 46_cfg.json +1 -0
- 47.pt +3 -0
- 47_cfg.json +1 -0
26.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a15430d658f85c828bbc8b13935703be5e9b0bdf4aeda9e4bdca0086262a05c
|
3 |
+
size 268510529
|
26_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 54, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": true, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
27.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e71a4f89a66a4b7c23c94e1693dd8f9e5e3dcd994e39aea54f5e60b65ad2ed3c
|
3 |
+
size 268510529
|
27_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 54, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": true, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
28.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac0377f18a4b6c5d66ef8b4d9922c5280a1d395f659295200148671ad0ee7253
|
3 |
+
size 268510529
|
28_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 54, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": true, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
29.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1be40582e8b1afa58742846323c30cd2361e1b73c63da3f3495bb95e4faa87f9
|
3 |
+
size 268510529
|
29_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 54, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": true, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
30.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:582ff82a7fc23db58c5b67bc3f7b3ceddf496cc91f9e208a79e8270379d2bb75
|
3 |
+
size 268510529
|
30_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": true, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
31.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9716596386d8e01357ad4f672546f77f74635a33c44d8ff83ed97b92c5071526
|
3 |
+
size 268510529
|
31_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
32.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1b24bebcd0575ebf8129e4bf75fd1b22c78eee5dc3ccf2d6525bf40dfed655b
|
3 |
+
size 268510529
|
32_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
33.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5729f67d753baab362565d4919893b9370f7f3df61ba4e6bc46df460422473a
|
3 |
+
size 268510529
|
33_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
34.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b2c212c37ed2d7d0e79542d21392588756f4d5dd2318ad962b12b366f8be4c7
|
3 |
+
size 268510529
|
34_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
35.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2286cdaad50e6786721239273b255a45754ed37c45b4f1f16640defbc27d8e3b
|
3 |
+
size 268510529
|
35_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
36.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0ee72407e569a6b30c70c4e618477a0aa10f44a3df4bf2ee59bd2d4fabfdcea
|
3 |
+
size 268510529
|
36_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
37.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef5847874fbe0b8bbb163605db29e40a13d775bdb57c99e46c29f7242e28d587
|
3 |
+
size 268510529
|
37_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
38.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bc9a27cf67da3ea2aa79ad69728425cec111e0b5d88ffa97b53b61a8abd72bf
|
3 |
+
size 268510529
|
38_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
39.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7d2d51a6be313d0004500df3316823393e3e2219e2cd56362af9d6545f94b00
|
3 |
+
size 268510529
|
39_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
40.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19304e5c419a46b2d32fa9ac3122164eb33ffcf45a91aa278c35dffb1a2079c1
|
3 |
+
size 268510529
|
40_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
41.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e3f311631023ab5669fca728425394eb4b41150b8be59f1e70f744774cdc533
|
3 |
+
size 268510529
|
41_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
42.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3aa702ddfadd82423aea11e328d6f4b276b5ed431a0fefa8db40182efd3ac1d1
|
3 |
+
size 268510529
|
42_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
43.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98961532116608ec7eb5764a176bcb4e30693677c10c586f09719043c4c7be90
|
3 |
+
size 268510529
|
43_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
44.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cad4fb29ec6f8eb70f9ecb7037c8dad50d2fdceaa4dd9473815ee411fafd0902
|
3 |
+
size 268510529
|
44_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
45.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea553092d14f6404ebee511161cb03e92188026ff34ba1b3d6653f8c48cfb1f7
|
3 |
+
size 268510529
|
45_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
46.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f08d675863e1b63b573a44fd0b488d3944472e1207e10c6e1f94462c5d38a7da
|
3 |
+
size 268510529
|
46_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
47.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05fff1837dbc55b5bda590721418bb358ab330bee666763c7a09debf5e46c7cc
|
3 |
+
size 268510529
|
47_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|