kamilakesbi committed on
Commit
ff3e9e2
1 Parent(s): 03a636a

Upload folder using huggingface_hub

Browse files
config.yaml CHANGED
@@ -5,6 +5,7 @@ params:
5
  threshold: 0.7045654963945799
6
  segmentation:
7
  min_duration_off: 0.0
 
8
  pipeline:
9
  name: pyannote.audio.pipelines.speaker_diarization.SpeakerDiarization
10
  params:
 
5
  threshold: 0.7045654963945799
6
  segmentation:
7
  min_duration_off: 0.0
8
+ version: 3.1
9
  pipeline:
10
  name: pyannote.audio.pipelines.speaker_diarization.SpeakerDiarization
11
  params:
embedding/config.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ _target_: pyannote.audio.models.embedding.wespeaker.WeSpeakerResNet34
3
+ dither: 0.0
4
+ frame_length: 25
5
+ frame_shift: 10
6
+ num_channels: 1
7
+ num_mel_bins: 80
8
+ sample_rate: 16000
9
+ use_energy: false
10
+ window_type: hamming
embedding/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6ebcd5526d688deb24b12eaae4774a6d8337c22bf7b7f25c1eaa1c345f6cae5
3
+ size 26644594
segmentation/config.yaml ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ _target_: pyannote.audio.models.segmentation.PyanNet.PyanNet
3
+ linear:
4
+ hidden_size: 128
5
+ num_layers: 2
6
+ lstm:
7
+ batch_first: true
8
+ bidirectional: true
9
+ dropout: 0.5
10
+ hidden_size: 128
11
+ monolithic: true
12
+ num_layers: 4
13
+ num_channels: 1
14
+ sample_rate: 16000
15
+ sincnet:
16
+ sample_rate: 16000
17
+ stride: 10
18
+ task:
19
+ duration: 10.0
20
+ max_speakers_per_chunk: 3
21
+ max_speakers_per_frame: 2
segmentation/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20f6de79768928db1564987c6fa644ad451eb9c1139999e68336721e49f9c52c
3
+ size 5912080