Training in progress, step 100000
Browse files- babyslm/syntactic.txt +0 -0
- blimp_results.json +2 -2
- config.json +1 -1
- model.safetensors +2 -2
- training_args.bin +1 -1
babyslm/syntactic.txt
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
blimp_results.json
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e53b54714a74a10d261403b1d01399b8c2605199b2196772adf5bcdb68a9ee96
|
3 |
+
size 80216307
|
config.json
CHANGED
@@ -13,7 +13,7 @@
|
|
13 |
"n_embd": 512,
|
14 |
"n_head": 8,
|
15 |
"n_inner": 2048,
|
16 |
-
"n_layer":
|
17 |
"n_positions": 256,
|
18 |
"reorder_and_upcast_attn": false,
|
19 |
"resid_pdrop": 0.1,
|
|
|
13 |
"n_embd": 512,
|
14 |
"n_head": 8,
|
15 |
"n_inner": 2048,
|
16 |
+
"n_layer": 6,
|
17 |
"n_positions": 256,
|
18 |
"reorder_and_upcast_attn": false,
|
19 |
"resid_pdrop": 0.1,
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c3737c4075d348ec1397c6a34ff3599f64137f988eaf0282105e939ef63961f
|
3 |
+
size 108961160
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5368
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:975f4c8fc39f5136ba79137eff2767d6095d8cadb172037c87f30b58b803cd77
|
3 |
size 5368
|