p1atdev
/

afv03-lora

Model card Files Files and versions Community

afv03-lora / rope-8 /rope_migration.yml

p1atdev's picture

Upload rope_migration.yml

96dde3a verified about 2 months ago

1.53 kB

	model:
	checkpoint_path: "./models/aura_flow_0.3.bnb_nf4.safetensors"
	pretrained_model_name_or_path: fal/AuraFlow-v0.3

	dtype: bfloat16

	denoiser:
	use_flash_attn: true

	use_rope: True
	rope_theta: 10000
	rope_dim_sizes: [32, 112, 112]

	noise_prediction_loss: true
	migration_loss: true
	# prior_preservation_loss: true

	peft:
	type: lora
	rank: 4
	alpha: 1.0
	dropout: 0.0

	dtype: bfloat16

	# include_keys: [".attn.", ".mlp.", ".modC.", ".modCX.", ".modX."]
	include_keys: [".attn.", ".modC.", "modCX", ".modX."]
	exclude_keys: ["text_encoder", "vae", "t_embedder", "final_linear"]

	dataset:
	folder: "data/pexels-1k-random"
	num_repeats: 2
	batch_size: 2

	bucket_base_size: 1024
	step: 128
	min_size: 384
	do_upscale: false

	caption_processors: []

	optimizer:
	name: "schedulefree.RAdamScheduleFree"
	# name: "bitsandbytes.optim.AdamW8bit"
	args:
	lr: 0.005

	scheduler:
	# name: "torch.optim.lr_scheduler.ConstantLR"
	# args: {}

	tracker:
	project_name: "auraflow-rope-1"
	loggers:
	- wandb

	saving:
	strategy:
	per_epochs: 1
	per_steps: null
	save_last: true

	callbacks:
	- type: "hf_hub" # or "hf_hub" to push to hub
	name: "rope-8"
	save_dir: "./output/rope-8"

	hub_id: "p1atdev/afv03-lora"
	dir_in_repo: "rope-8"

	seed: 42
	num_train_epochs: 20

	trainer:
	# debug_mode: "1step"

	gradient_checkpointing: true

	torch_compile: true
	torch_compile_args:
	mode: max-autotune
	fullgraph: true
	fp32_matmul_precision: "medium"