EchoNet-Synthetic / lvdm /config.json
HReynaud's picture
models batch 1
56c538a
raw
history blame contribute delete
989 Bytes
{
"_class_name": "UNetSpatioTemporalConditionModel",
"_diffusers_version": "0.27.2",
"addition_time_embed_dim": 1,
"block_out_channels": [
128,
256,
256,
512
],
"cross_attention_dim": 1,
"decay": 0.9999,
"down_block_types": [
"CrossAttnDownBlockSpatioTemporal",
"CrossAttnDownBlockSpatioTemporal",
"CrossAttnDownBlockSpatioTemporal",
"DownBlockSpatioTemporal"
],
"in_channels": 8,
"inv_gamma": 1.0,
"layers_per_block": 2,
"min_decay": 0.0,
"num_attention_heads": [
8,
16,
16,
32
],
"num_frames": 64,
"optimization_step": 60000,
"out_channels": 4,
"power": 0.6666666666666666,
"projection_class_embeddings_input_dim": 1,
"sample_size": 14,
"transformer_layers_per_block": 1,
"up_block_types": [
"UpBlockSpatioTemporal",
"CrossAttnUpBlockSpatioTemporal",
"CrossAttnUpBlockSpatioTemporal",
"CrossAttnUpBlockSpatioTemporal"
],
"update_after_step": 0,
"use_ema_warmup": false
}