# Model hyperparameters.
# Values are plain YAML scalars: integers, floats, and lowercase booleans.

# Network size (presumably depth, attention heads, hidden width -- confirm
# against the consuming model code).
num_layers: 32
num_heads: 8
d_model: 256

# NOTE(review): T and S are not defined in this file; presumably a temporal
# length and a per-step token count -- confirm with the consumer.
T: 16
S: 256

# Vocabulary settings. With the values below,
# image_vocab_size == factored_vocab_size ** num_factored_vocabs
# (512 ** 2 == 262144); presumably intentional -- keep in sync if either changes.
image_vocab_size: 262144
use_mup: false
num_factored_vocabs: 2
factored_vocab_size: 512

# Corruption / masking and prompting settings (semantics defined by the
# consumer; TODO confirm valid ranges).
max_corrupt_rate: 0.2
non_mlm_ratio: 0.5
num_prompt_frames: 8

# Attention options.
qkv_bias: false
proj_bias: true
attn_drop: 0
qk_norm: false

# MLP options.
mlp_ratio: 4
mlp_drop: 0
mlp_bias: true