{ | |
"d_model": 2048, | |
"decoder_attention_heads": 32, | |
"decoder_ffn_dim": 4096, | |
"decoder_layers": 24, | |
"decoder_start_token_id": 16384, | |
"encoder_attention_heads": 32, | |
"encoder_ffn_dim": 4096, | |
"encoder_layers": 24, | |
"encoder_vocab_size": 50272, | |
"image_length": 256, | |
"image_vocab_size": 16415, | |
"max_text_length": 64 | |
} | |