Transformers
dragonSwing committed on
Commit
78e0d8f
·
1 Parent(s): 09e18b1

Update model

Browse files

Signed-off-by: Binh Le <[email protected]>

classifier.ckpt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1c5cf560dc904388ca459804ce8ee11944b3edc102a146d2a7c3c3ea1b3b67b
3
- size 9067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:420ed305f44ddf60cd109627682c75c98b76a45c15b0cd43d44606a867137289
3
+ size 5995
embedding_model.ckpt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0766e6aba5bd68e4a080116bb8ae17afc616284d1c2a50a22d67202b56e73b11
3
- size 1065702
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85c18d1b214d7bb56ab3748e45ba339e0893f9baeb516ebb7e65aeec7b540123
3
+ size 798438
hyperparams.yaml CHANGED
@@ -9,7 +9,7 @@ pretrained_path: /content/drive/MyDrive/audify/inference
9
  n_mels: 80
10
 
11
  # Output parameters
12
- out_n_neurons: 4 # Possible languages in the dataset
13
 
14
  # Model params
15
  compute_features: !new:speechbrain.lobes.features.Fbank
@@ -24,7 +24,7 @@ CNN: !new:speechbrain.lobes.models.convolution.ConvolutionFrontEnd
24
  input_shape: (null, null, 80)
25
  num_blocks: 3
26
  num_layers_per_block: 1
27
- out_channels: (128, 256, 512)
28
  kernel_sizes: (3, 3, 1)
29
  strides: (2, 2, 1)
30
  residuals: (False, False, False)
@@ -42,7 +42,7 @@ embedding_model: !new:speechbrain.nnet.containers.LengthsCapableSequential
42
  pooling: !ref <pooling>
43
 
44
  classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
45
- input_size: 512
46
  out_neurons: !ref <out_n_neurons>
47
 
48
  modules:
 
9
  n_mels: 80
10
 
11
  # Output parameters
12
+ out_n_neurons: 5 # Number of output classes (must match the entries in label_encoder.txt)
13
 
14
  # Model params
15
  compute_features: !new:speechbrain.lobes.features.Fbank
 
24
  input_shape: (null, null, 80)
25
  num_blocks: 3
26
  num_layers_per_block: 1
27
+ out_channels: (128, 256, 256)
28
  kernel_sizes: (3, 3, 1)
29
  strides: (2, 2, 1)
30
  residuals: (False, False, False)
 
42
  pooling: !ref <pooling>
43
 
44
  classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
45
+ input_size: 256
46
  out_neurons: !ref <out_n_neurons>
47
 
48
  modules:
label_encoder.txt CHANGED
@@ -1,6 +1,7 @@
1
- 'speech' => 0
2
- 'noisy_speech' => 1
3
- 'corrupted' => 2
4
  'music' => 3
 
5
  ================
6
  'starting_index' => 0
 
1
+ 'clean' => 0
2
+ 'noisy' => 1
3
+ 'corrupt' => 2
4
  'music' => 3
5
+ 'background' => 4
6
  ================
7
  'starting_index' => 0