Commit
·
d739829
1
Parent(s):
03b47d0
Push fork of accent-id-commonaccent_xlsr-en-english
Browse files - hyperparams.yaml +23 -24
hyperparams.yaml
CHANGED
|
@@ -20,40 +20,39 @@ pretrained_path: Jzuluaga/accent-id-commonaccent_xlsr-en-english
|
|
| 20 |
encoder_dim: 1024
|
| 21 |
out_n_neurons: 16
|
| 22 |
|
| 23 |
-
wav2vec2:
|
| 24 |
-
|
| 25 |
-
|
| 26 |
-
|
| 27 |
-
|
|
|
|
| 28 |
|
| 29 |
avg_pool: !new:speechbrain.nnet.pooling.StatisticsPooling
|
| 30 |
-
|
| 31 |
|
| 32 |
output_mlp: !new:speechbrain.nnet.linear.Linear
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
| 36 |
|
| 37 |
model: !new:torch.nn.ModuleList
|
| 38 |
-
|
| 39 |
|
| 40 |
modules:
|
| 41 |
-
|
| 42 |
-
|
| 43 |
-
|
| 44 |
|
| 45 |
softmax: !new:speechbrain.nnet.activations.Softmax
|
| 46 |
-
|
| 47 |
-
label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
|
| 48 |
|
|
|
|
| 49 |
|
| 50 |
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
|
| 51 |
-
|
| 52 |
-
|
| 53 |
-
|
| 54 |
-
|
| 55 |
-
|
| 56 |
-
|
| 57 |
-
|
| 58 |
-
|
| 59 |
-
|
|
|
|
| 20 |
encoder_dim: 1024
|
| 21 |
out_n_neurons: 16
|
| 22 |
|
| 23 |
+
wav2vec2:
|
| 24 |
+
!new:speechbrain.lobes.models.huggingface_transformers.wav2vec2.Wav2Vec2
|
| 25 |
+
source: !ref <wav2vec2_hub>
|
| 26 |
+
output_norm: True
|
| 27 |
+
freeze: True
|
| 28 |
+
save_path: wav2vec2_checkpoints
|
| 29 |
|
| 30 |
avg_pool: !new:speechbrain.nnet.pooling.StatisticsPooling
|
| 31 |
+
return_std: False
|
| 32 |
|
| 33 |
output_mlp: !new:speechbrain.nnet.linear.Linear
|
| 34 |
+
input_size: !ref <encoder_dim>
|
| 35 |
+
n_neurons: !ref <out_n_neurons>
|
| 36 |
+
bias: False
|
| 37 |
|
| 38 |
model: !new:torch.nn.ModuleList
|
| 39 |
+
- [!ref <output_mlp>]
|
| 40 |
|
| 41 |
modules:
|
| 42 |
+
wav2vec2: !ref <wav2vec2>
|
| 43 |
+
output_mlp: !ref <output_mlp>
|
| 44 |
+
avg_pool: !ref <avg_pool>
|
| 45 |
|
| 46 |
softmax: !new:speechbrain.nnet.activations.Softmax
|
|
|
|
|
|
|
| 47 |
|
| 48 |
+
label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
|
| 49 |
|
| 50 |
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
|
| 51 |
+
loadables:
|
| 52 |
+
wav2vec2: !ref <wav2vec2>
|
| 53 |
+
model: !ref <model>
|
| 54 |
+
label_encoder: !ref <label_encoder>
|
| 55 |
+
paths:
|
| 56 |
+
wav2vec2: !ref <pretrained_path>/wav2vec2.ckpt
|
| 57 |
+
model: !ref <pretrained_path>/model.ckpt
|
| 58 |
+
label_encoder: !ref <pretrained_path>/label_encoder.txt
|
|
|