{
  "_from_model_config": true,
  "_name_or_path": "openbmb/cpm-bee-10b",
  "architectures": [
    "CpmBeeForWithTransform"
  ],
  "auto_map": {
    "AutoConfig": "configuration_cpmbee.CpmBeeConfig",
    "AutoModel": "modeling_cpmbee.CpmBeeWithTransform",
    "AutoTokenizer": "tokenization_viscpmbee.VisCpmBeeTokenizer"
  },
  "vocab_size": 86583,
  "hidden_size": 4096,
  "dim_ff": 10240,
  "num_hidden_layers": 48,
  "num_attention_heads": 32,
  "dim_head": 128,
  "dropout_p": 0.0,
  "position_bias_num_buckets": 256,
  "position_bias_num_segment_buckets": 256,
  "position_bias_max_distance": 2048,
  "eps": 1e-6,
  "half": false,
  "model_type": "viscpmbee",
  "unet_cross_attention_dim": 1024
}