{
  "device": "cuda",
  "dropout": 0.2,
  "n_blocks": 4,
  "transformer_config": {
    "block_size": 250,
    "dropout": 0.2,
    "n_embd": 496,
    "n_head": 8
  },
  "vocab_size": 8010,
  "xlstm_config": {
    "batch_size": 8,
    "block_size": 250,
    "config_block": "msm",
    "device": "cuda",
    "n_embd": 496
  }
}