Upload 4 files

Files changed (4) hide show

config.yaml ADDED Viewed

+pretrained_model_path: ./checkpoints/Bingsu/my-korean-stable-diffusion-v1-5
+output_dir: outputs/bear_guitar
+train_data:
+  video_path: data/man-surfing.mp4
+  prompt: A man is surfing
+  n_sample_frames: 24
+  width: 512
+  height: 512
+  sample_start_idx: 0
+  sample_frame_rate: 2
+validation_data:
+  prompts:
+  - 미키마우스가 서핑을 타고 있습니다
+  - 한 여자가 서핑을 타고 있습니다
+  - 흰색 옷을 입은 남자가 바다를 걷고 있습니다
+  video_length: 24
+  width: 512
+  height: 512
+  num_inference_steps: 20
+  guidance_scale: 12.5
+  use_inv_latent: true
+  num_inv_steps: 50
+validation_steps: 100
+trainable_modules:
+- attn1.to_q
+- attn2.to_q
+- attn_temp
+train_batch_size: 1
+max_train_steps: 400
+learning_rate: 3.0e-05
+scale_lr: false
+lr_scheduler: constant
+lr_warmup_steps: 0
+adam_beta1: 0.9
+adam_beta2: 0.999
+adam_weight_decay: 0.01
+adam_epsilon: 1.0e-08
+max_grad_norm: 1.0
+gradient_accumulation_steps: 1
+gradient_checkpointing: true
+checkpointing_steps: 1000
+resume_from_checkpoint: null
+mixed_precision: fp16
+use_8bit_adam: false
+enable_xformers_memory_efficient_attention: true
+seed: 33

model_index.json ADDED Viewed

+{
+  "_class_name": "TuneAVideoPipeline",
+  "_diffusers_version": "0.11.1",
+  "scheduler": [
+    "diffusers",
+    "PNDMScheduler"
+  ],
+  "text_encoder": [
+    "transformers",
+    "CLIPTextModel"
+  ],
+  "tokenizer": [
+    "transformers",
+    "CLIPTokenizer"
+  ],
+  "unet": [
+    "models",
+    "UNet3DConditionModel"
+  ],
+  "vae": [
+    "diffusers",
+    "AutoencoderKL"
+  ]
+}

vae/config.json ADDED Viewed

+{
+  "_class_name": "AutoencoderKL",
+  "_diffusers_version": "0.11.1",
+  "_name_or_path": "./checkpoints/Bingsu/my-korean-stable-diffusion-v1-5",
+  "act_fn": "silu",
+  "block_out_channels": [
+    128,
+    256,
+    512,
+    512
+  ],
+  "down_block_types": [
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D",
+    "DownEncoderBlock2D"
+  ],
+  "in_channels": 3,
+  "latent_channels": 4,
+  "layers_per_block": 2,
+  "norm_num_groups": 32,
+  "out_channels": 3,
+  "sample_size": 512,
+  "scaling_factor": 0.18215,
+  "up_block_types": [
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D",
+    "UpDecoderBlock2D"
+  ]
+}

vae/diffusion_pytorch_model.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:081334a8acb2a2eecbee377823b2819669d45f56c593159a20d13754c96571fa
+size 167407601