File size: 1,293 Bytes
3a2565f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
# Training configuration for an SSLMOS run (wav2vec2 upstream, seed 3337).
# Keys are grouped by concern below; mapping order carries no meaning in YAML,
# so the parsed result is the same as a flat alphabetical listing.

# Run bookkeeping
version: 0.1.0
config: conf/ssl-mos-wav2vec2.yaml
additional_config: null
outdir: exp/ssl-mos-wav2vec2-3337  # directory suffix matches `seed`
seed: 3337
verbose: 1
# Both are empty strings; presumably "start from scratch, nothing to resume"
# -- confirm against the training script.
init_checkpoint: ''
resume: ''

# Process layout
distributed: false
rank: 0

# Data
dataset_type: NonIntrusiveDataset
collater_type: NonIntrusiveCollater
train_csv_path: data/nisqa_train.csv
dev_csv_path: data/nisqa_dev.csv
sampling_rate: 16000  # presumably Hz -- confirm
model_input: waveform
wav_only: true
padding_mode: repetitive
allow_cache: true

# Data loading
train_batch_size: 16
test_batch_size: 1
num_workers: 0
pin_memory: true

# Model
model_type: SSLMOS
model_params:
  # Upstream SSL encoder
  ssl_module: s3prl
  s3prl_name: wav2vec2
  ssl_model_layer_idx: -1  # NOTE(review): looks like "last layer" -- confirm
  ssl_model_output_dim: 768
  # Mean-score head
  mean_net_dnn_dim: 64
  mean_net_output_type: scalar
  mean_net_range_clipping: true
  # Listener modelling is switched off (see also listener_score_criterions).
  use_listener_modeling: false
  use_mean_listener: false
inference_mode: mean_net

# Losses
mean_score_criterions:
  - criterion_type: ScalarLoss
    criterion_weight: 1.0
    criterion_params:
      order: 1
      tau: 0.5
      masked_loss: false
listener_score_criterions: null

# Optimisation
optimizer_type: SGD
optimizer_params:
  lr: 0.001
  momentum: 0.9
scheduler_type: null
grad_norm: 1.0  # presumably the gradient-clipping threshold -- confirm

# Training loop, evaluation and checkpoint selection
trainer_type: NonIntrusiveEstimatorTrainer
train_max_steps: 100000
log_interval_steps: 100
eval_and_save_interval_steps: 100
patience: 20
keep_nbest_models: 5
# Models are ranked by `utt_SRCC`, highest first.
best_model_criterion:
  key: utt_SRCC
  order: highest