{
  "_class_name": "MaskGiTUViT_v2",
  "_version": "0.0.1",
  "add_cond_embeds": true,
  "add_micro_cond_embeds": true,
  "attention_dropout": 0.0,
  "block_num_heads": 12,
  "block_out_channels": [
    768
  ],
  "codebook_size": 8192,
  "cond_embed_dim": 768,
  "encoder_hidden_size": 768,
  "force_down_up_sample": true,
  "hidden_dropout": 0.0,
  "hidden_size": 1024,
  "in_channels": 768,
  "intermediate_size": 2816,
  "layer_norm_eps": 1e-06,
  "ln_elementwise_affine": true,
  "mask_token_id": 8255,
  "micro_cond_embed_dim": 1280,
  "micro_cond_encode_dim": 256,
  "norm_type": "rmsnorm",
  "num_attention_heads": 16,
  "num_hidden_layers": 22,
  "num_res_blocks": 3,
  "use_bias": false,
  "use_fused_mlp": false,
  "use_fused_residual_norm": false,
  "vocab_size": 8256
}