Cristhian2430 committed on
Commit
fbe969b
·
verified ·
1 Parent(s): e86e571

Upload WhisperForConditionalGeneration

Browse files
Files changed (3) hide show
  1. config.json +4 -7
  2. generation_config.json +15 -119
  3. model.safetensors +3 -0
config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_name_or_path": "openai/whisper-large-v3",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
@@ -9,7 +8,7 @@
9
  "attention_dropout": 0.0,
10
  "begin_suppress_tokens": [
11
  220,
12
- 50257
13
  ],
14
  "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
@@ -17,7 +16,7 @@
17
  "decoder_attention_heads": 20,
18
  "decoder_ffn_dim": 5120,
19
  "decoder_layerdrop": 0.0,
20
- "decoder_layers": 32,
21
  "decoder_start_token_id": 50258,
22
  "dropout": 0.0,
23
  "encoder_attention_heads": 20,
@@ -34,18 +33,16 @@
34
  "mask_time_length": 10,
35
  "mask_time_min_masks": 2,
36
  "mask_time_prob": 0.05,
37
- "max_length": 448,
38
  "max_source_positions": 1500,
39
  "max_target_positions": 448,
40
  "median_filter_width": 7,
41
  "model_type": "whisper",
42
  "num_hidden_layers": 32,
43
  "num_mel_bins": 128,
44
- "pad_token_id": 50256,
45
  "scale_embedding": false,
46
- "suppress_tokens": [],
47
  "torch_dtype": "float32",
48
- "transformers_version": "4.36.0.dev0",
49
  "use_cache": true,
50
  "use_weighted_layer_sum": false,
51
  "vocab_size": 51866
 
1
  {
 
2
  "activation_dropout": 0.0,
3
  "activation_function": "gelu",
4
  "apply_spec_augment": false,
 
8
  "attention_dropout": 0.0,
9
  "begin_suppress_tokens": [
10
  220,
11
+ 50256
12
  ],
13
  "bos_token_id": 50257,
14
  "classifier_proj_size": 256,
 
16
  "decoder_attention_heads": 20,
17
  "decoder_ffn_dim": 5120,
18
  "decoder_layerdrop": 0.0,
19
+ "decoder_layers": 4,
20
  "decoder_start_token_id": 50258,
21
  "dropout": 0.0,
22
  "encoder_attention_heads": 20,
 
33
  "mask_time_length": 10,
34
  "mask_time_min_masks": 2,
35
  "mask_time_prob": 0.05,
 
36
  "max_source_positions": 1500,
37
  "max_target_positions": 448,
38
  "median_filter_width": 7,
39
  "model_type": "whisper",
40
  "num_hidden_layers": 32,
41
  "num_mel_bins": 128,
42
+ "pad_token_id": 50257,
43
  "scale_embedding": false,
 
44
  "torch_dtype": "float32",
45
+ "transformers_version": "4.56.0.dev0",
46
  "use_cache": true,
47
  "use_weighted_layer_sum": false,
48
  "vocab_size": 51866
generation_config.json CHANGED
@@ -1,44 +1,28 @@
1
  {
2
  "alignment_heads": [
3
  [
4
- 7,
5
- 0
6
- ],
7
- [
8
- 10,
9
- 17
10
- ],
11
- [
12
- 12,
13
- 18
14
  ],
15
  [
16
- 13,
17
- 12
18
  ],
19
  [
20
- 16,
21
- 1
22
  ],
23
  [
24
- 17,
25
- 14
26
  ],
27
  [
28
- 19,
29
  11
30
  ],
31
  [
32
- 21,
33
- 4
34
- ],
35
- [
36
- 24,
37
- 1
38
- ],
39
- [
40
- 25,
41
- 6
42
  ]
43
  ],
44
  "begin_suppress_tokens": [
@@ -161,104 +145,16 @@
161
  "<|yue|>": 50358,
162
  "<|zh|>": 50260
163
  },
164
- "max_initial_timestamp_index": 1,
165
  "max_length": 448,
166
  "no_timestamps_token_id": 50364,
167
  "pad_token_id": 50257,
 
168
  "return_timestamps": false,
169
- "suppress_tokens": [
170
- 1,
171
- 2,
172
- 7,
173
- 8,
174
- 9,
175
- 10,
176
- 14,
177
- 25,
178
- 26,
179
- 27,
180
- 28,
181
- 29,
182
- 31,
183
- 58,
184
- 59,
185
- 60,
186
- 61,
187
- 62,
188
- 63,
189
- 90,
190
- 91,
191
- 92,
192
- 93,
193
- 359,
194
- 503,
195
- 522,
196
- 542,
197
- 873,
198
- 893,
199
- 902,
200
- 918,
201
- 922,
202
- 931,
203
- 1350,
204
- 1853,
205
- 1982,
206
- 2460,
207
- 2627,
208
- 3246,
209
- 3253,
210
- 3268,
211
- 3536,
212
- 3846,
213
- 3961,
214
- 4183,
215
- 4667,
216
- 6585,
217
- 6647,
218
- 7273,
219
- 9061,
220
- 9383,
221
- 10428,
222
- 10929,
223
- 11938,
224
- 12033,
225
- 12331,
226
- 12562,
227
- 13793,
228
- 14157,
229
- 14635,
230
- 15265,
231
- 15618,
232
- 16553,
233
- 16604,
234
- 18362,
235
- 18956,
236
- 20075,
237
- 21675,
238
- 22520,
239
- 26130,
240
- 26161,
241
- 26435,
242
- 28279,
243
- 29464,
244
- 31650,
245
- 32302,
246
- 32470,
247
- 36865,
248
- 42863,
249
- 47425,
250
- 49870,
251
- 50254,
252
- 50258,
253
- 50359,
254
- 50360,
255
- 50361,
256
- 50362,
257
- 50363
258
- ],
259
  "task_to_id": {
260
  "transcribe": 50360,
261
  "translate": 50359
262
  },
263
- "transformers_version": "4.36.0.dev0"
264
  }
 
1
  {
2
  "alignment_heads": [
3
  [
4
+ 2,
5
+ 4
 
 
 
 
 
 
 
 
6
  ],
7
  [
8
+ 2,
9
+ 11
10
  ],
11
  [
12
+ 3,
13
+ 3
14
  ],
15
  [
16
+ 3,
17
+ 6
18
  ],
19
  [
20
+ 3,
21
  11
22
  ],
23
  [
24
+ 3,
25
+ 14
 
 
 
 
 
 
 
 
26
  ]
27
  ],
28
  "begin_suppress_tokens": [
 
145
  "<|yue|>": 50358,
146
  "<|zh|>": 50260
147
  },
148
+ "max_initial_timestamp_index": 50,
149
  "max_length": 448,
150
  "no_timestamps_token_id": 50364,
151
  "pad_token_id": 50257,
152
+ "prev_sot_token_id": 50362,
153
  "return_timestamps": false,
154
+ "suppress_tokens": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
155
  "task_to_id": {
156
  "transcribe": 50360,
157
  "translate": 50359
158
  },
159
+ "transformers_version": "4.56.0.dev0"
160
  }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f2ece75ee449a288d23b728b1bd32d4a150c3c71550301d2e780af1cde69c9a
3
+ size 3235581408