# Model configuration.
# Each `_target_` value is the dotted path of the class that node configures
# (presumably resolved by a Hydra-style instantiate call -- TODO confirm).
model:
  _target_: modules.gaudio.sv_encoder.SenseVoiceSmall

  # Arguments for the SpecAugLFR node.
  specaug:
    _target_: modules.gaudio.sv_encoder.SpecAugLFR
    apply_freq_mask: true
    apply_time_mask: true
    apply_time_warp: false
    freq_mask_width_range: [0, 30]
    lfr_rate: 6
    num_freq_mask: 1
    num_time_mask: 1
    time_mask_width_range: [0, 12]
    # time_warp_* values are listed even though apply_time_warp is false.
    time_warp_mode: bicubic
    time_warp_window: 5

  # Arguments for the SenseVoiceEncoderSmall node.
  encoder:
    _target_: modules.gaudio.sv_encoder.SenseVoiceEncoderSmall
    attention_dropout_rate: 0.1
    attention_heads: 4
    dropout_rate: 0.1
    kernel_size: 11
    linear_units: 2048
    normalize_before: true
    num_blocks: 50
    output_size: 512
    # NOTE(review): the spelling "sanm_shfit" is kept exactly as found; it
    # presumably matches the consumer's keyword -- verify before renaming.
    sanm_shfit: 0
    tp_blocks: 20
    # NOTE(review): `input_size: 560` occurred twice in the flattened source.
    # The first occurrence is placed here on the assumption that it belongs to
    # the encoder and the second to the model -- confirm against both classes.
    input_size: 560

  # Model-level arguments.
  length_normalized_loss: true
  input_size: 560
  vocab_size: 25055
  sos: 1
  eos: 2
  ignore_id: -1