Auto Commit
Browse files- 0.pt +3 -0
- 0_cfg.json +1 -0
- 1.pt +3 -0
- 10.pt +3 -0
- 10_cfg.json +1 -0
- 11.pt +3 -0
- 11_cfg.json +1 -0
- 12.pt +3 -0
- 12_cfg.json +1 -0
- 13.pt +3 -0
- 13_cfg.json +1 -0
- 14.pt +3 -0
- 14_cfg.json +1 -0
- 15.pt +3 -0
- 15_cfg.json +1 -0
- 16.pt +3 -0
- 16_cfg.json +1 -0
- 17.pt +3 -0
- 17_cfg.json +1 -0
- 18.pt +3 -0
- 18_cfg.json +1 -0
- 19.pt +3 -0
- 19_cfg.json +1 -0
- 2.pt +3 -0
- 20.pt +3 -0
- 20_cfg.json +1 -0
- 21.pt +3 -0
- 21_cfg.json +1 -0
- 22.pt +3 -0
- 22_cfg.json +1 -0
- 23.pt +3 -0
- 23_cfg.json +1 -0
- 24.pt +3 -0
- 24_cfg.json +1 -0
- 25.pt +3 -0
- 25_cfg.json +1 -0
- 3.pt +3 -0
- 3_cfg.json +1 -0
- 4.pt +3 -0
- 4_cfg.json +1 -0
- 5.pt +3 -0
- 5_cfg.json +1 -0
- 6.pt +3 -0
- 6_cfg.json +1 -0
- 7.pt +3 -0
- 7_cfg.json +1 -0
- 8.pt +3 -0
- 8_cfg.json +1 -0
- 9.pt +3 -0
- 9_cfg.json +1 -0
0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a042fd2631d6f62ca7ec30dbd73181827069901902fdcfca6d0cf09d0a677b37
|
3 |
+
size 268510523
|
0_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 47, "batch_size": 1024, "model_batch_size": 128, "lr": 0.0001, "num_tokens": 10000000, "l1_coeff": 0.003, "wd": 0.01, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128}
|
1.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c204ed0887ac37f411dafb05ce66e93bc894cb85f7bfa0cd7260ce5246d6696c
|
3 |
+
size 268510459
|
10.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:728c81255ddb856a599e6d3618c2ce487261209976bfacfdb9eab4dcecba7435
|
3 |
+
size 268510529
|
10_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
11.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d82e9fa0699839cc8183f002ed4e2f6ba7d30df99ea0642022680b78b3de044b
|
3 |
+
size 268510529
|
11_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
12.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92df6dec158a428394ed58bab299970251d0e39f326f7d96a258ea58d97d560e
|
3 |
+
size 268510529
|
12_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
13.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03f0bea930d6cb59496de1317c318290d3503bae5f0b5226d1bcb94238d09054
|
3 |
+
size 268510529
|
13_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
14.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46da744fbd3fc5e100fa5094a6b90020fb9b9f2ad8426aadd920359c5aa35b31
|
3 |
+
size 268510529
|
14_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
15.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54dcf18422f2ad27f86011001604126ede300c69766378df6603cbcf1e4007bc
|
3 |
+
size 268510529
|
15_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
16.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7e162389521b680d8e68e5a3c51edd9776f2dc36f34840d785dbd76990490de
|
3 |
+
size 268510529
|
16_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
17.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04f6206b4efdd98d867f53874a74294f3816fa99f1bbab0191d3c81cec172c31
|
3 |
+
size 268510529
|
17_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
18.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9435fbf3509d1bb0103cd4b85b35b3e4ca507015cac16921764fc5b41b662e4
|
3 |
+
size 268510529
|
18_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
19.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31fd3b874ce1605b97617f614342d5f9ccdab3eb390a2c998b081fa89ac73b71
|
3 |
+
size 268510529
|
19_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
2.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe6e48c1f15bdeafd8e31ce1c01650175d0013a79fe550f2bfc6ab068e76cea9
|
3 |
+
size 134255931
|
20.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9e20a19683d1448faccf77464b7096f682288afab302d7542540bce374f61eb
|
3 |
+
size 268510529
|
20_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
21.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:834da8142b939663d7b6e5fc5313ff397913aa85e4b8139a93f949b4fd752dcf
|
3 |
+
size 268510529
|
21_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
22.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:972a11b4c479f08356f70c9a9bf9e241ed7c8f65ec3c2af8bdc305d2be054950
|
3 |
+
size 268510529
|
22_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
23.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73c1741db7ea37c943009b96b9bffde23c3c70fd87d668ac36026d8f92cfc470
|
3 |
+
size 268510529
|
23_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
24.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74df28c3513cf8a80dde8b1da3e2a4230f1d7e51ff7b9a78e7129dafe87cd5e5
|
3 |
+
size 268510529
|
24_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
25.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9e5d2e691cef7bef044c6b5f91159cce6c67eadd8389638220a402075e1bf9c
|
3 |
+
size 268510529
|
25_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|
3.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aaa431156b0e466a67d57a4849430b805f723ac39e1cce15d06f172097f887c1
|
3 |
+
size 134255931
|
3_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 47, "batch_size": 4096, "buffer_mult": 512, "lr": 0.0001, "num_tokens": 10000000, "l1_coeff": 0.003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "model_batch_size": 512, "buffer_size": 2097152, "buffer_batches": 16384}
|
4.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f5e61053dca12ded5deaeab1cacfe1bba4ca6f5ba9f7baabdf3691b72ed0333
|
3 |
+
size 268510523
|
4_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 47, "batch_size": 4096, "buffer_mult": 512, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 2097152, "buffer_batches": 16384}
|
5.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8ceaa3b26f97c975142dec66a6894e17b510eb641c7f90ae76084f3db75a600
|
3 |
+
size 268510523
|
5_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 47, "batch_size": 4096, "buffer_mult": 512, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 2097152, "buffer_batches": 16384}
|
6.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:208880c7aca2855e8ef2a3f30a4c41d0907b9df79413e7fefe3e4c2f54129eba
|
3 |
+
size 268510523
|
6_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 49, "batch_size": 4096, "buffer_mult": 512, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 2097152, "buffer_batches": 16384}
|
7.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2b0edd0f9921349640bde9ae0d22273b16aae6c83ae84cda3af45ef9c5c8666
|
3 |
+
size 268510523
|
7_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 50, "batch_size": 4096, "buffer_mult": 512, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 2097152, "buffer_batches": 16384}
|
8.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9e886e0b7618a9fc7ba005985287ea46680b2ed4b68f6638561c753caf15480
|
3 |
+
size 268510523
|
8_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 51, "batch_size": 4096, "buffer_mult": 512, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 2097152, "buffer_batches": 16384}
|
9.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:389eaf32ef10a144b28b2e2722cb83adf26eb53df3bddee27e31c67d88b7e9c5
|
3 |
+
size 268510523
|
9_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
|