model: target: hy3dgen.shapegen.models.Hunyuan3DDiT params: in_channels: 64 context_in_dim: 1536 hidden_size: 1024 mlp_ratio: 4.0 num_heads: 16 depth: 16 depth_single_blocks: 32 axes_dim: [ 64 ] theta: 10000 qkv_bias: True vae: target: hy3dgen.shapegen.models.ShapeVAE params: num_latents: 3072 embed_dim: 64 num_freqs: 8 include_pi: false heads: 16 width: 1024 num_decoder_layers: 16 qkv_bias: false qk_norm: true scale_factor: 0.9990943042622529 conditioner: target: hy3dgen.shapegen.models.SingleImageEncoder params: main_image_encoder: type: DinoImageEncoder # dino giant kwargs: config: attention_probs_dropout_prob: 0.0 drop_path_rate: 0.0 hidden_act: gelu hidden_dropout_prob: 0.0 hidden_size: 1536 image_size: 518 initializer_range: 0.02 layer_norm_eps: 1.e-6 layerscale_value: 1.0 mlp_ratio: 4 model_type: dinov2 num_attention_heads: 24 num_channels: 3 num_hidden_layers: 40 patch_size: 14 qkv_bias: true torch_dtype: float32 use_swiglu_ffn: true image_size: 518 scheduler: target: hy3dgen.shapegen.schedulers.FlowMatchEulerDiscreteScheduler params: num_train_timesteps: 1000 image_processor: target: hy3dgen.shapegen.preprocessors.ImageProcessorV2 params: size: 512 border_ratio: 0.15 pipeline: target: hy3dgen.shapegen.pipelines.Hunyuan3DDiTFlowMatchingPipeline