p1atdev committed on
Commit
7c3c1ec
·
verified ·
1 Parent(s): cf22c97

Upload rope_migration.yml

Browse files
Files changed (1) hide show
  1. rope-13/rope_migration.yml +102 -0
rope-13/rope_migration.yml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ checkpoint_path: "./models/aura_flow_0.3.bnb_nf4.safetensors"
3
+ pretrained_model_name_or_path: fal/AuraFlow-v0.3
4
+
5
+ dtype: bfloat16
6
+
7
+ denoiser:
8
+ use_flash_attn: true
9
+
10
+ use_rope: true
11
+ rope_theta: 10000
12
+ rope_dim_sizes: [32, 112, 112]
13
+
14
+ noise_prediction_loss: true
15
+ migration_loss: true
16
+ # prior_preservation_loss: true
17
+
18
+ peft:
19
+ type: lora
20
+ rank: 4
21
+ alpha: 1.0
22
+ dropout: 0.0
23
+
24
+ dtype: bfloat16
25
+
26
+ include_keys:
27
+ - ".mlp."
28
+ - ".attn."
29
+
30
+ exclude_keys:
31
+ - "text_encoder"
32
+ - "vae"
33
+ - "t_embedder"
34
+ - "final_linear"
35
+ - regex: .*\.mod[CX]{1,2} # exclude modulation layers (modC, modCX, modX)
36
+
37
+ dataset:
38
+ folder: "data/pexels-1k-random"
39
+ num_repeats: 2
40
+ batch_size: 2
41
+
42
+ bucket_base_size: 1024
43
+ step: 128
44
+ min_size: 384
45
+ do_upscale: false
46
+
47
+ caption_processors: []
48
+
49
+ optimizer:
50
+ name: "schedulefree.RAdamScheduleFree"
51
+ # name: "bitsandbytes.optim.AdamW8bit"
52
+ args:
53
+ lr: 0.005
54
+
55
+ scheduler:
56
+ # name: "torch.optim.lr_scheduler.ConstantLR"
57
+ # args: {}
58
+
59
+ tracker:
60
+ project_name: "auraflow-rope-1"
61
+ loggers:
62
+ - wandb
63
+
64
+ saving:
65
+ strategy:
66
+ per_epochs: 1
67
+ per_steps: null
68
+ save_last: true
69
+
70
+ callbacks:
71
+ - type: "hf_hub"  # "hf_hub" pushes to the hub
72
+ name: "rope-13"
73
+ save_dir: "./output/rope-13"
74
+
75
+ hub_id: "p1atdev/afv03-lora"
76
+ dir_in_repo: "rope-13"
77
+
78
+ preview:
79
+ strategy:
80
+ per_epochs: 1
81
+ per_steps: 100
82
+
83
+ callbacks:
84
+ - type: "discord"
85
+ url: "https://discord.com/api/webhooks/1327274657308610560/3T8Jj1DqkF7_T0eiYWThHu9dvqlcSYXPFFrGq8Dsd-k7lgp7MYyF5WN7KS65SW4K-v1l"  # NOTE(review): webhook URL embeds a secret token; rotate it and keep it out of version control
86
+
87
+ data:
88
+ path: "./projects/rope/preview.yml"
89
+
90
+ seed: 42
91
+ num_train_epochs: 20
92
+
93
+ trainer:
94
+ # debug_mode: "1step"
95
+
96
+ gradient_checkpointing: true
97
+
98
+ torch_compile: true
99
+ torch_compile_args:
100
+ mode: max-autotune
101
+ fullgraph: true
102
+ fp32_matmul_precision: "medium"