gorinars committed on
Commit
a57d74a
·
1 Parent(s): b429bbc

first commit

Browse files
.gitattributes CHANGED
@@ -32,3 +32,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ embedding_model.ckpt filter=lfs diff=lfs merge=lfs -text
36
+ normalizer.ckpt filter=lfs diff=lfs merge=lfs -text
37
+ projector.ckpt filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "speechbrain_interface": "SpeakerRecognition"
3
+ }
embedding_model.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca6f7dcf4eb97e68fb0989e3fbc9c667c60eaa0c598753e86e7b07bac0729755
3
+ size 301999678
hyperparams.yaml ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ############################################################################
2
+ # Model: Cnn14 (PANN) embedding + SimSiam projector for speaker verification (ECAPA-TDNN classifier head)
3
+ # ############################################################################
4
+
5
+ # Feature parameters
6
+ n_mels: 80
7
+
8
+ # Pretrained checkpoint folder (HuggingFace repo ID)
9
+ pretrained_path: gorinars/sb-cssl-offline-wp
10
+
11
+ # Output parameters
12
+ out_n_neurons: 308
13
+
14
+ # Model params
15
+ compute_features: !new:speechbrain.lobes.features.Fbank
16
+ n_mels: 80
17
+ left_frames: 0
18
+ right_frames: 0
19
+ deltas: false
20
+ sample_rate: 16000
21
+ n_fft: 400
22
+ win_length: 25
23
+ hop_length: 10
24
+ f_min: 0
25
+
26
+
27
+ mean_var_norm: !new:speechbrain.processing.features.InputNormalization
28
+ norm_type: sentence
29
+ std_norm: False
30
+
31
+ classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
32
+ input_size: 2048
33
+ out_neurons: !ref <out_n_neurons>
34
+
35
+ embedding_model: !new:speechbrain.nnet.containers.LengthsCapableSequential
36
+ input_shape: [null, 1, null]
37
+ embedding: !new:crytorch.models.components.pann.Cnn14
38
+ mel_bins: 80
39
+ emb_dim: 2048
40
+ norm_type: bn
41
+ projector: !new:crytorch.models.components.pann.SimSiamProjector
42
+ input_size: 2048
43
+ hidden_size: 2048
44
+ output_size: 2048
45
+ norm_type: bn
46
+
47
+ modules:
48
+ compute_features: !ref <compute_features>
49
+ mean_var_norm: !ref <mean_var_norm>
50
+ embedding_model: !ref <embedding_model>
51
+ classifier: !ref <classifier>
52
+
53
+ label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
54
+
55
+
56
+ pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
57
+ loadables:
58
+ embedding: !ref <embedding_model.embedding>
59
+ projector: !ref <embedding_model.projector>
60
+ paths:
61
+ embedding: !ref <pretrained_path>/embedding_model.ckpt
62
+ projector: !ref <pretrained_path>/projector.ckpt
63
+
64
+
normalizer.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01dd629a2a24b29ad133b15930494e168114b788c4d7579ac2862e3d406e00fb
3
+ size 1063
projector.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6918979197eb1af1eed53eb64405e08730f91fc1742707dc1bf821dbef7ec2fa
3
+ size 33640379