{
  "d_model": 1024,
  "decoder_attention_heads": 16,
  "decoder_ffn_dim": 2730,
  "decoder_layers": 12,
  "decoder_start_token_id": 16384,
  "encoder_attention_heads": 16,
  "encoder_ffn_dim": 2730,
  "encoder_layers": 12,
  "encoder_vocab_size": 50264,
  "image_length": 256,
  "image_vocab_size": 16384,
  "max_text_length": 64
}