File size: 1,870 Bytes
33facbc
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94

[DEFAULTS]
# Default values for a training run: run identity, batching, data loading and seeding.

# name of the run
exp_name = F5

# the batch size
batch_size = 8 

# the chunk size, in frames (maximum and minimum)
# NOTE(review): what one "frame" corresponds to is not defined in this file — confirm against the data loader
max_frames = 3000 
min_frames = 10

# number of CPU workers for the DataLoader
num_workers = 4

# the random seed
seed = 42

# number of batches for gradient accumulation
# NOTE(review): grad_accumulation_steps further down looks like it controls the same thing — confirm which key the trainer reads
accum_batches = 1

# number of steps between checkpoints
# NOTE(review): save_per_updates and last_per_steps further down also set checkpoint intervals — confirm which keys the trainer reads
checkpoint_every = 10000                              
                     
# trainer checkpoint file to restart training from (left empty here)
ckpt_path = ''

# model checkpoint file to start a new training run from (left empty here)
pretrained_ckpt_path = ''

# checkpoint path for the pretransform model, if needed (left empty here)
pretransform_ckpt_path = ''

# model configuration file specifying the model hyperparameters (left empty here)
model_config = ''

# configuration file for the datasets (left empty here)
dataset_config = ''

# directory to save the checkpoints in (left empty here)
# NOTE(review): presumably the empty '' values in this group are meant to be overridden at launch — confirm
save_dir = ''

# maximum gradient norm
# NOTE(review): presumably the gradient-clipping threshold — confirm in the trainer
max_grad_norm = 1.0

# number of gradient accumulation steps
# NOTE(review): accum_batches earlier in this section looks like it controls the same thing — confirm which key the trainer reads
grad_accumulation_steps = 1

# learning rate
learning_rate = 7.5e-5

# number of training epochs
epochs = 110 

# number of warmup updates
num_warmup_updates = 2000

# save a checkpoint every this many updates
save_per_updates = 5000

# save the "last" checkpoint every this many steps
# NOTE(review): how this differs from save_per_updates is not visible in this file — confirm in the trainer
last_per_steps = 5000

# Data locations for prompts, lyrics (lrc) and latents. Each value holds several absolute
# paths joined with '|'; the paths are specific to the original training environment.
# NOTE(review): presumably the loader splits each value on '|' — confirm against the dataset code
# NOTE(review): the values are double-quoted; whether the quotes are stripped depends on the
# parser that reads this file — confirm before changing the quoting
prompt_path = "/mnt/sfs/music/lance/style-lance-full|/mnt/sfs/music/lance/style-lance-cnen-music-second"
lrc_path = "/mnt/sfs/music/lance/lrc-lance-emb-full|/mnt/sfs/music/lance/lrc-lance-cnen-second"
latent_path = "/mnt/sfs/music/lance/latent-lance|/mnt/sfs/music/lance/latent-lance-cnen-music-second-1|/mnt/sfs/music/lance/latent-lance-cnen-music-second-2"

# drop probabilities for the audio, cond, style and lrc inputs
# NOTE(review): presumably the chance of dropping each conditioning input during training — inferred from the key names; confirm in the training code
audio_drop_prob = 0.3
cond_drop_prob = 0.0
style_drop_prob = 0.1
lrc_drop_prob = 0.1

# lyrics handling options
# NOTE(review): the 0/1 values look like boolean flags — confirm how the trainer interprets them
align_lyrics = 0
lyrics_slice = 0
parse_lyrics = 1
skip_empty_lyrics = 0
# NOTE(review): the meaning of -1 is not defined in this file — confirm against the dataset code
lyrics_shift = -1

# NOTE(review): looks like a 0/1 flag enabling the style prompt — confirm
use_style_prompt = 1

# tokenizer to use
tokenizer_type = gpt2

# NOTE(review): looks like a 0/1 flag controlling whether the learning rate is reset — confirm when it applies
reset_lr = 0

# NOTE(review): a second seed-like value, separate from `seed` earlier in this section — confirm what it seeds
resumable_with_seed = 666

# NOTE(review): units are not defined in this file — confirm what is being downsampled and by what measure
downsample_rate = 2048

# NOTE(review): presumably a 0/1 flag for gradient checkpointing — confirm
grad_ckpt = 0

# dataset file list; an absolute path specific to the original training environment
dataset_path = "/mnt/sfs/music/hkchen/workspace/F5-TTS-HW/filelists/music123latent_asred_bpmstyle_cnen_pure1"

# NOTE(review): a probability-like value; what "pure" refers to is not defined in this file — confirm in the dataset code
pure_prob = 0.0