tyler committed on
Commit
9c88e9c
·
1 Parent(s): 1cd0a28
age_gender/w2v2-L-robust-6-age-gender.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75c5cc3debc2013215cee5f331a66b59bd7205da170fb61abab46fc4507df7be
3
+ size 363421332
hubert/DPHuBERT-sp0.75.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:384d72429163b79cd9f4deaf41aa2cbc990e7526b4430f2a22d40c5e70c14be7
3
+ size 99132650
hubert/hubert_base.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f54b40fd2802423a5643779c4861af1e9ee9c1564dc9d32f54f20b5ffba7db96
3
+ size 189507909
hubert/hubert_base_12_768.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfb3e1787cecc78023fa40c7ace8897b7bcce093d8d4b5ea4357e3cee23f1f32
3
+ size 384166505
hubert/hubert_base_12_768_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:754d85e95f5a97ea45cac275875524b588529a1d926db140dbac3c8ce1fe0020
3
+ size 195568997
hubert/hubert_base_9_256_proj_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d86b7dfb677ee0391e470b8372b13a57d5fcbb1709b6a609aacd4b1e50568406
3
+ size 151293032
hubert/hubert_base_ailia_2_output.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7aaee8684892f54ff181b46d2f4e8aef7684af76be7713346844b8de924dedf
3
+ size 293548373
rmvpe/crepe_onnx_full.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:119845c72c702e052e5262430f9d120bce46176689aa226c39d09dea5cc3a610
3
+ size 88984790
rmvpe/crepe_onnx_tiny.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91fc2a0fd10f965dbf7775995daf50e99273caedd7efd00001f23be649da1bc3
3
+ size 1955762
rmvpe/fcpe.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988522bdee2b0954ec5d43eb3fd6805c7a7d05cd8198a031e6ca67251bdbb872
3
+ size 43917245
rmvpe/fcpe_cents_include.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59e991f1077bbbadb222b718b0434360a1aff1b1916c943ef1285b996895e385
3
+ size 43768220
rmvpe/rmvpe.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5370e71ac80af8b4b7c793d27efd51fd8bf962de3a7ede0766dac0befa3660fd
3
+ size 361688443
rmvpe/rmvpe.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d62215f4306e3ca278246188607209f09af3dc77ed4232efdd069798c4ec193
3
+ size 181184272
rmvpe/rmvpe_230917.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19dc1809cf4cdb0a18db93441816bc327e14e5644b72eeaae5220560c6736fe2
3
+ size 368492925
rmvpe/rmvpe_inputs.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:339fcb7e1476b302e9aecef4a951e918c20852b2e871de5eea13b06e554e0a3a
3
+ size 33527
rmvpe/rmvpe_mel_include.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84f0586308e36157f75b77c8591bf636d6719c0c4ba95f8faf3df479e7566219
3
+ size 362003174
{speak_detect → speak_detection}/snakers4_silero-vad_master/__init__.py RENAMED
File without changes
{speak_detect → speak_detection}/snakers4_silero-vad_master/data/__init__.py RENAMED
File without changes
{speak_detect → speak_detection}/snakers4_silero-vad_master/data/silero_vad.onnx RENAMED
File without changes
{speak_detect → speak_detection}/snakers4_silero-vad_master/hubconf.py RENAMED
File without changes
{speak_detect → speak_detection}/snakers4_silero-vad_master/model.py RENAMED
File without changes
{speak_detect → speak_detection}/snakers4_silero-vad_master/utils_vad.py RENAMED
@@ -132,31 +132,34 @@ class Validator():
132
 
133
  def read_audio(path: str,
134
  sampling_rate: int = 16000):
135
- list_backends = torchaudio.list_audio_backends()
136
-
137
- assert len(list_backends) > 0, 'The list of available backends is empty, please install backend manually. \
138
- \n Recommendations: \n \tSox (UNIX OS) \n \tSoundfile (Windows OS, UNIX OS) \n \tffmpeg (Windows OS, UNIX OS)'
139
-
140
- try:
141
- effects = [
142
- ['channels', '1'],
143
- ['rate', str(sampling_rate)]
144
- ]
145
-
146
- wav, sr = torchaudio.sox_effects.apply_effects_file(path, effects=effects)
147
- except:
148
- wav, sr = torchaudio.load(path)
149
-
150
- if wav.size(0) > 1:
151
- wav = wav.mean(dim=0, keepdim=True)
152
-
153
- if sr != sampling_rate:
154
- transform = torchaudio.transforms.Resample(orig_freq=sr,
155
- new_freq=sampling_rate)
156
- wav = transform(wav)
157
- sr = sampling_rate
158
-
159
- assert sr == sampling_rate
 
 
 
160
  return wav.squeeze(0)
161
 
162
 
 
132
 
133
  def read_audio(path: str,
134
  sampling_rate: int = 16000):
135
+ if isinstance(path, np.ndarray):
136
+ wav = torch.tensor(path.reshape(1, -1))
137
+ else:
138
+ list_backends = torchaudio.list_audio_backends()
139
+
140
+ assert len(list_backends) > 0, 'The list of available backends is empty, please install backend manually. \
141
+ \n Recommendations: \n \tSox (UNIX OS) \n \tSoundfile (Windows OS, UNIX OS) \n \tffmpeg (Windows OS, UNIX OS)'
142
+
143
+ try:
144
+ effects = [
145
+ ['channels', '1'],
146
+ ['rate', str(sampling_rate)]
147
+ ]
148
+
149
+ wav, sr = torchaudio.sox_effects.apply_effects_file(path, effects=effects)
150
+ except:
151
+ wav, sr = torchaudio.load(path)
152
+
153
+ if wav.size(0) > 1:
154
+ wav = wav.mean(dim=0, keepdim=True)
155
+
156
+ if sr != sampling_rate:
157
+ transform = torchaudio.transforms.Resample(orig_freq=sr,
158
+ new_freq=sampling_rate)
159
+ wav = transform(wav)
160
+ sr = sampling_rate
161
+
162
+ assert sr == sampling_rate
163
  return wav.squeeze(0)
164
 
165