File size: 1,272 Bytes
e6a6383
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
{
    "model": "src.training.dcc_tf",
    "model_params":
    {
        "label_len": 41,
        "L": 32,
        "enc_dim": 512,
        "num_enc_layers": 10,
        "dec_dim": 256,
        "num_dec_layers": 1,
        "dec_buf_len": 13,
        "dec_chunk_size": 13,
        "out_buf_len": 4,
        "use_pos_enc": true
    },
    "train_data":
    {
        "input_dir": "data/FSDSoundScapes",
        "dset": "train",
        "sr": 44100,
        "resample_rate": null,
        "max_num_targets": 3
    },
    "val_data":
    {
        "input_dir": "data/FSDSoundScapes",
        "dset": "val",
        "sr": 44100,
        "resample_rate": null,
        "max_num_targets": 3
    },
    "test_data":
    {
        "input_dir": "data/FSDSoundScapes",
        "dset": "test",
        "sr": 44100,
        "resample_rate": null,
        "max_num_targets": 3
    },
    "optim":
    {
        "lr": 5e-4,
        "weight_decay": 0.0
    },
    "lr_sched":
    {
        "mode": "max",
        "factor": 0.1,
        "patience": 5,
        "min_lr": 5e-6,
        "threshold": 0.1,
        "threshold_mode": "abs"
    },
    "base_metric": "scale_invariant_signal_noise_ratio",
    "fix_lr_epochs": 50,
    "epochs": 150,
    "batch_size": 16,
    "eval_batch_size": 64,
    "n_workers": 16
}