h 32, l 16, g 8
Browse files
scripts/pretrain-model.yaml
CHANGED
@@ -8,7 +8,7 @@ model_config:
|
|
8 |
padded_vocab_size: 38400
|
9 |
vocab_size: 38400
|
10 |
block_size: 8192
|
11 |
-
n_layer:
|
12 |
n_head: 32
|
13 |
head_size: null
|
14 |
n_embd: 256
|
|
|
8 |
padded_vocab_size: 38400
|
9 |
vocab_size: 38400
|
10 |
block_size: 8192
|
11 |
+
n_layer: 16
|
12 |
n_head: 32
|
13 |
head_size: null
|
14 |
n_embd: 256
|