{
  "architectures": [
    "RNNForLanguageModeling"
  ],
  "bidirectional": false,
  "dropout_p": 0.1,
  "emb_init_range": 0.1,
  "embedding_dim": 1024,
  "embedding_kwargs": {},
  "hidden_dim": 1024,
  "lin_init_range": 0.03125,
  "lm_in_features": 1024,
  "model_type": "rnn",
  "num_layers": 2,
  "output_last_state": false,
  "output_recurrent_outputs": false,
  "recur_init_range": 0.03125,
  "rnn_kwargs": {},
  "rnn_type": "LSTM",
  "tie_weights": true,
  "torch_dtype": "float32",
  "transformers_version": "4.33.3",
  "vocab_size": 50002
}