Commit
·
78e0d8f
1
Parent(s):
09e18b1
Update model
Browse files
Signed-off-by: Binh Le <[email protected]>
- classifier.ckpt +2 -2
- embedding_model.ckpt +2 -2
- hyperparams.yaml +3 -3
- label_encoder.txt +4 -3
classifier.ckpt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:420ed305f44ddf60cd109627682c75c98b76a45c15b0cd43d44606a867137289
|
3 |
+
size 5995
|
embedding_model.ckpt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85c18d1b214d7bb56ab3748e45ba339e0893f9baeb516ebb7e65aeec7b540123
|
3 |
+
size 798438
|
hyperparams.yaml
CHANGED
@@ -9,7 +9,7 @@ pretrained_path: /content/drive/MyDrive/audify/inference
|
|
9 |
n_mels: 80
|
10 |
|
11 |
# Output parameters
|
12 |
-
out_n_neurons:
|
13 |
|
14 |
# Model params
|
15 |
compute_features: !new:speechbrain.lobes.features.Fbank
|
@@ -24,7 +24,7 @@ CNN: !new:speechbrain.lobes.models.convolution.ConvolutionFrontEnd
|
|
24 |
input_shape: (null, null, 80)
|
25 |
num_blocks: 3
|
26 |
num_layers_per_block: 1
|
27 |
-
out_channels: (128, 256,
|
28 |
kernel_sizes: (3, 3, 1)
|
29 |
strides: (2, 2, 1)
|
30 |
residuals: (False, False, False)
|
@@ -42,7 +42,7 @@ embedding_model: !new:speechbrain.nnet.containers.LengthsCapableSequential
|
|
42 |
pooling: !ref <pooling>
|
43 |
|
44 |
classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
|
45 |
-
input_size:
|
46 |
out_neurons: !ref <out_n_neurons>
|
47 |
|
48 |
modules:
|
|
|
9 |
n_mels: 80
|
10 |
|
11 |
# Output parameters
|
12 |
+
out_n_neurons: 5 # Possible languages in the dataset
|
13 |
|
14 |
# Model params
|
15 |
compute_features: !new:speechbrain.lobes.features.Fbank
|
|
|
24 |
input_shape: (null, null, 80)
|
25 |
num_blocks: 3
|
26 |
num_layers_per_block: 1
|
27 |
+
out_channels: (128, 256, 256)
|
28 |
kernel_sizes: (3, 3, 1)
|
29 |
strides: (2, 2, 1)
|
30 |
residuals: (False, False, False)
|
|
|
42 |
pooling: !ref <pooling>
|
43 |
|
44 |
classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
|
45 |
+
input_size: 256
|
46 |
out_neurons: !ref <out_n_neurons>
|
47 |
|
48 |
modules:
|
label_encoder.txt
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
-
'
|
2 |
-
'
|
3 |
-
'
|
4 |
'music' => 3
|
|
|
5 |
================
|
6 |
'starting_index' => 0
|
|
|
1 |
+
'clean' => 0
|
2 |
+
'noisy' => 1
|
3 |
+
'corrupt' => 2
|
4 |
'music' => 3
|
5 |
+
'background' => 4
|
6 |
================
|
7 |
'starting_index' => 0
|