{
  "_class_name": "MaskGiTUViT_v2",
  "_version": "0.0.1",
  "adapter_proj_dim": 32,
  "add_cond_embeds": true,
  "add_micro_cond_embeds": true,
  "attention_dropout": 0.0,
  "block_num_heads": 12,
  "block_out_channels": [
    768
  ],
  "codebook_size": 8192,
  "cond_embed_dim": 768,
  "decay": 0.9999,
  "encoder_hidden_size": 768,
  "force_down_up_sample": true,
  "hidden_dropout": 0.0,
  "hidden_size": 1024,
  "in_channels": 768,
  "intermediate_size": 2816,
  "inv_gamma": 1.0,
  "is_adapter_shared": false,
  "layer_norm_eps": 1e-06,
  "ln_elementwise_affine": true,
  "mask_token_id": 8255,
  "micro_cond_embed_dim": 1280,
  "micro_cond_encode_dim": 256,
  "min_decay": 0.0,
  "norm_type": "rmsnorm",
  "num_attention_heads": 16,
  "num_hidden_layers": 22,
  "num_res_blocks": 3,
  "optimization_step": 600,
  "power": 0.6666666666666666,
  "update_after_step": 0,
  "use_adapter": true,
  "use_bias": false,
  "use_ema_warmup": false,
  "use_fused_mlp": false,
  "use_fused_residual_norm": true,
  "vocab_size": 8256
}