Update config.json
Browse files- config.json +0 -21
config.json
CHANGED
@@ -16,16 +16,7 @@
|
|
16 |
-1
|
17 |
],
|
18 |
"classifier_proj_size": 256,
|
19 |
-
"cnn_module_kernel": [
|
20 |
-
31,
|
21 |
-
31,
|
22 |
-
15,
|
23 |
-
15,
|
24 |
-
15,
|
25 |
-
31
|
26 |
-
],
|
27 |
"codevector_dim": 256,
|
28 |
-
"conformer_conv_dropout": 0.1,
|
29 |
"contrastive_logits_temperature": 0.1,
|
30 |
"conv_bias": false,
|
31 |
"conv_depthwise_kernel_size": 31,
|
@@ -56,12 +47,6 @@
|
|
56 |
2,
|
57 |
2
|
58 |
],
|
59 |
-
"csgu_activation": "identity",
|
60 |
-
"csgu_conv_dropout": 0.1,
|
61 |
-
"csgu_kernel_size": 31,
|
62 |
-
"csgu_use_linear_after_conv": false,
|
63 |
-
"ctc_loss_reduction": "sum",
|
64 |
-
"ctc_zero_infinity": false,
|
65 |
"diversity_loss_weight": 0.1,
|
66 |
"do_stable_layer_norm": true,
|
67 |
"downsampling_factor": [
|
@@ -89,7 +74,6 @@
|
|
89 |
256,
|
90 |
192
|
91 |
],
|
92 |
-
"eos_token_id": 2,
|
93 |
"feat_extract_activation": "gelu",
|
94 |
"feat_extract_norm": "layer",
|
95 |
"feat_proj_dropout": 0.0,
|
@@ -123,7 +107,6 @@
|
|
123 |
"mask_time_min_masks": 2,
|
124 |
"mask_time_prob": 0.05,
|
125 |
"max_source_positions": 5000,
|
126 |
-
"merge_conv_kernel": 31,
|
127 |
"model_type": "wav2vec2-zipformer",
|
128 |
"num_adapter_layers": 3,
|
129 |
"num_attention_heads": 8,
|
@@ -156,10 +139,8 @@
|
|
156 |
"pad_token_id": 0,
|
157 |
"pos_dim": 48,
|
158 |
"pos_head_dim": 4,
|
159 |
-
"position_embeddings_type": "relative",
|
160 |
"proj_codevector_dim": 256,
|
161 |
"query_head_dim": 32,
|
162 |
-
"rotary_embedding_base": 10000,
|
163 |
"tdnn_dilation": [
|
164 |
1,
|
165 |
2,
|
@@ -182,8 +163,6 @@
|
|
182 |
1
|
183 |
],
|
184 |
"transformers_version": "4.34.1",
|
185 |
-
"use_fbanks": false,
|
186 |
-
"use_macaron_ff": true,
|
187 |
"use_weighted_layer_sum": false,
|
188 |
"value_head_dim": 12,
|
189 |
"vocab_size": null,
|
|
|
16 |
-1
|
17 |
],
|
18 |
"classifier_proj_size": 256,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
19 |
"codevector_dim": 256,
|
|
|
20 |
"contrastive_logits_temperature": 0.1,
|
21 |
"conv_bias": false,
|
22 |
"conv_depthwise_kernel_size": 31,
|
|
|
47 |
2,
|
48 |
2
|
49 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
50 |
"diversity_loss_weight": 0.1,
|
51 |
"do_stable_layer_norm": true,
|
52 |
"downsampling_factor": [
|
|
|
74 |
256,
|
75 |
192
|
76 |
],
|
|
|
77 |
"feat_extract_activation": "gelu",
|
78 |
"feat_extract_norm": "layer",
|
79 |
"feat_proj_dropout": 0.0,
|
|
|
107 |
"mask_time_min_masks": 2,
|
108 |
"mask_time_prob": 0.05,
|
109 |
"max_source_positions": 5000,
|
|
|
110 |
"model_type": "wav2vec2-zipformer",
|
111 |
"num_adapter_layers": 3,
|
112 |
"num_attention_heads": 8,
|
|
|
139 |
"pad_token_id": 0,
|
140 |
"pos_dim": 48,
|
141 |
"pos_head_dim": 4,
|
|
|
142 |
"proj_codevector_dim": 256,
|
143 |
"query_head_dim": 32,
|
|
|
144 |
"tdnn_dilation": [
|
145 |
1,
|
146 |
2,
|
|
|
163 |
1
|
164 |
],
|
165 |
"transformers_version": "4.34.1",
|
|
|
|
|
166 |
"use_weighted_layer_sum": false,
|
167 |
"value_head_dim": 12,
|
168 |
"vocab_size": null,
|