indiejoseph commited on
Commit
9d9ba26
1 Parent(s): 6c71261

Model save

Browse files
README.md CHANGED
@@ -1,9 +1,6 @@
1
  ---
2
- language:
3
- - zh
4
- - yue
5
  license: mit
6
- base_model: facebook/mbart-large-50
7
  tags:
8
  - generated_from_trainer
9
  model-index:
@@ -16,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # mbart-translation-zh-yue
18
 
19
- This model is a fine-tuned version of [facebook/mbart-large-50](https://huggingface.co/facebook/mbart-large-50) on the None dataset.
20
 
21
  ## Model description
22
 
@@ -36,14 +33,12 @@ More information needed
36
 
37
  The following hyperparameters were used during training:
38
  - learning_rate: 5e-05
39
- - train_batch_size: 8
40
  - eval_batch_size: 8
41
  - seed: 42
42
- - gradient_accumulation_steps: 2
43
- - total_train_batch_size: 16
44
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
  - lr_scheduler_type: linear
46
- - num_epochs: 4.0
47
 
48
  ### Training results
49
 
@@ -51,7 +46,7 @@ The following hyperparameters were used during training:
51
 
52
  ### Framework versions
53
 
54
- - Transformers 4.33.2
55
  - Pytorch 2.0.1+cu118
56
  - Datasets 2.14.5
57
- - Tokenizers 0.13.3
 
1
  ---
 
 
 
2
  license: mit
3
+ base_model: indiejoseph/mbart-translation-zh-yue
4
  tags:
5
  - generated_from_trainer
6
  model-index:
 
13
 
14
  # mbart-translation-zh-yue
15
 
16
+ This model is a fine-tuned version of [indiejoseph/mbart-translation-zh-yue](https://huggingface.co/indiejoseph/mbart-translation-zh-yue) on the None dataset.
17
 
18
  ## Model description
19
 
 
33
 
34
  The following hyperparameters were used during training:
35
  - learning_rate: 5e-05
36
+ - train_batch_size: 16
37
  - eval_batch_size: 8
38
  - seed: 42
 
 
39
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
40
  - lr_scheduler_type: linear
41
+ - num_epochs: 1.0
42
 
43
  ### Training results
44
 
 
46
 
47
  ### Framework versions
48
 
49
+ - Transformers 4.34.0.dev0
50
  - Pytorch 2.0.1+cu118
51
  - Datasets 2.14.5
52
+ - Tokenizers 0.14.0
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "facebook/mbart-large-50",
3
  "_num_labels": 3,
4
  "activation_dropout": 0.0,
5
  "activation_function": "gelu",
@@ -52,7 +52,7 @@
52
  "static_position_embeddings": false,
53
  "tokenizer_class": "MBart50Tokenizer",
54
  "torch_dtype": "float32",
55
- "transformers_version": "4.33.2",
56
  "use_cache": true,
57
  "vocab_size": 250054
58
  }
 
1
  {
2
+ "_name_or_path": "indiejoseph/mbart-translation-zh-yue",
3
  "_num_labels": 3,
4
  "activation_dropout": 0.0,
5
  "activation_function": "gelu",
 
52
  "static_position_embeddings": false,
53
  "tokenizer_class": "MBart50Tokenizer",
54
  "torch_dtype": "float32",
55
+ "transformers_version": "4.34.0.dev0",
56
  "use_cache": true,
57
  "vocab_size": 250054
58
  }
generation_config.json CHANGED
@@ -8,5 +8,5 @@
8
  "max_length": 200,
9
  "num_beams": 5,
10
  "pad_token_id": 1,
11
- "transformers_version": "4.33.2"
12
  }
 
8
  "max_length": 200,
9
  "num_beams": 5,
10
  "pad_token_id": 1,
11
+ "transformers_version": "4.34.0.dev0"
12
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e8d1833544d1118d34229844f39dc521fc94fd250db234f6751322d3a9e122c
3
  size 2444694045
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae98478e44316e541dfed712f137e0432a905fe9308ec799d02e39ed2bc894d2
3
  size 2444694045
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f785da5a9277ae8a1031e2b8ab37683590d02b249b2b55e72fdc971bc94746f1
3
- size 17109735
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66bb383f85ae5c8e1a08f6a9be4d484340fb75419fe506aab6c7d1ea1ebd573b
3
+ size 17094307
tokenizer_config.json CHANGED
@@ -1,4 +1,462 @@
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "additional_special_tokens": [
3
  "ar_AR",
4
  "cs_CZ",
@@ -57,14 +515,7 @@
57
  "clean_up_tokenization_spaces": true,
58
  "cls_token": "<s>",
59
  "eos_token": "</s>",
60
- "mask_token": {
61
- "__type": "AddedToken",
62
- "content": "<mask>",
63
- "lstrip": true,
64
- "normalized": true,
65
- "rstrip": false,
66
- "single_word": false
67
- },
68
  "model_max_length": 1024,
69
  "pad_token": "<pad>",
70
  "sep_token": "</s>",
 
1
  {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<pad>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "250001": {
36
+ "content": "ar_AR",
37
+ "lstrip": true,
38
+ "normalized": false,
39
+ "rstrip": true,
40
+ "single_word": false,
41
+ "special": true
42
+ },
43
+ "250002": {
44
+ "content": "cs_CZ",
45
+ "lstrip": true,
46
+ "normalized": false,
47
+ "rstrip": true,
48
+ "single_word": false,
49
+ "special": true
50
+ },
51
+ "250003": {
52
+ "content": "de_DE",
53
+ "lstrip": true,
54
+ "normalized": false,
55
+ "rstrip": true,
56
+ "single_word": false,
57
+ "special": true
58
+ },
59
+ "250004": {
60
+ "content": "en_XX",
61
+ "lstrip": true,
62
+ "normalized": false,
63
+ "rstrip": true,
64
+ "single_word": false,
65
+ "special": true
66
+ },
67
+ "250005": {
68
+ "content": "es_XX",
69
+ "lstrip": true,
70
+ "normalized": false,
71
+ "rstrip": true,
72
+ "single_word": false,
73
+ "special": true
74
+ },
75
+ "250006": {
76
+ "content": "et_EE",
77
+ "lstrip": true,
78
+ "normalized": false,
79
+ "rstrip": true,
80
+ "single_word": false,
81
+ "special": true
82
+ },
83
+ "250007": {
84
+ "content": "fi_FI",
85
+ "lstrip": true,
86
+ "normalized": false,
87
+ "rstrip": true,
88
+ "single_word": false,
89
+ "special": true
90
+ },
91
+ "250008": {
92
+ "content": "fr_XX",
93
+ "lstrip": true,
94
+ "normalized": false,
95
+ "rstrip": true,
96
+ "single_word": false,
97
+ "special": true
98
+ },
99
+ "250009": {
100
+ "content": "gu_IN",
101
+ "lstrip": true,
102
+ "normalized": false,
103
+ "rstrip": true,
104
+ "single_word": false,
105
+ "special": true
106
+ },
107
+ "250010": {
108
+ "content": "hi_IN",
109
+ "lstrip": true,
110
+ "normalized": false,
111
+ "rstrip": true,
112
+ "single_word": false,
113
+ "special": true
114
+ },
115
+ "250011": {
116
+ "content": "it_IT",
117
+ "lstrip": true,
118
+ "normalized": false,
119
+ "rstrip": true,
120
+ "single_word": false,
121
+ "special": true
122
+ },
123
+ "250012": {
124
+ "content": "ja_XX",
125
+ "lstrip": true,
126
+ "normalized": false,
127
+ "rstrip": true,
128
+ "single_word": false,
129
+ "special": true
130
+ },
131
+ "250013": {
132
+ "content": "kk_KZ",
133
+ "lstrip": true,
134
+ "normalized": false,
135
+ "rstrip": true,
136
+ "single_word": false,
137
+ "special": true
138
+ },
139
+ "250014": {
140
+ "content": "ko_KR",
141
+ "lstrip": true,
142
+ "normalized": false,
143
+ "rstrip": true,
144
+ "single_word": false,
145
+ "special": true
146
+ },
147
+ "250015": {
148
+ "content": "lt_LT",
149
+ "lstrip": true,
150
+ "normalized": false,
151
+ "rstrip": true,
152
+ "single_word": false,
153
+ "special": true
154
+ },
155
+ "250016": {
156
+ "content": "lv_LV",
157
+ "lstrip": true,
158
+ "normalized": false,
159
+ "rstrip": true,
160
+ "single_word": false,
161
+ "special": true
162
+ },
163
+ "250017": {
164
+ "content": "my_MM",
165
+ "lstrip": true,
166
+ "normalized": false,
167
+ "rstrip": true,
168
+ "single_word": false,
169
+ "special": true
170
+ },
171
+ "250018": {
172
+ "content": "ne_NP",
173
+ "lstrip": true,
174
+ "normalized": false,
175
+ "rstrip": true,
176
+ "single_word": false,
177
+ "special": true
178
+ },
179
+ "250019": {
180
+ "content": "nl_XX",
181
+ "lstrip": true,
182
+ "normalized": false,
183
+ "rstrip": true,
184
+ "single_word": false,
185
+ "special": true
186
+ },
187
+ "250020": {
188
+ "content": "ro_RO",
189
+ "lstrip": true,
190
+ "normalized": false,
191
+ "rstrip": true,
192
+ "single_word": false,
193
+ "special": true
194
+ },
195
+ "250021": {
196
+ "content": "ru_RU",
197
+ "lstrip": true,
198
+ "normalized": false,
199
+ "rstrip": true,
200
+ "single_word": false,
201
+ "special": true
202
+ },
203
+ "250022": {
204
+ "content": "si_LK",
205
+ "lstrip": true,
206
+ "normalized": false,
207
+ "rstrip": true,
208
+ "single_word": false,
209
+ "special": true
210
+ },
211
+ "250023": {
212
+ "content": "tr_TR",
213
+ "lstrip": true,
214
+ "normalized": false,
215
+ "rstrip": true,
216
+ "single_word": false,
217
+ "special": true
218
+ },
219
+ "250024": {
220
+ "content": "vi_VN",
221
+ "lstrip": true,
222
+ "normalized": false,
223
+ "rstrip": true,
224
+ "single_word": false,
225
+ "special": true
226
+ },
227
+ "250025": {
228
+ "content": "zh_CN",
229
+ "lstrip": true,
230
+ "normalized": false,
231
+ "rstrip": true,
232
+ "single_word": false,
233
+ "special": true
234
+ },
235
+ "250026": {
236
+ "content": "af_ZA",
237
+ "lstrip": true,
238
+ "normalized": false,
239
+ "rstrip": true,
240
+ "single_word": false,
241
+ "special": true
242
+ },
243
+ "250027": {
244
+ "content": "az_AZ",
245
+ "lstrip": true,
246
+ "normalized": false,
247
+ "rstrip": true,
248
+ "single_word": false,
249
+ "special": true
250
+ },
251
+ "250028": {
252
+ "content": "bn_IN",
253
+ "lstrip": true,
254
+ "normalized": false,
255
+ "rstrip": true,
256
+ "single_word": false,
257
+ "special": true
258
+ },
259
+ "250029": {
260
+ "content": "fa_IR",
261
+ "lstrip": true,
262
+ "normalized": false,
263
+ "rstrip": true,
264
+ "single_word": false,
265
+ "special": true
266
+ },
267
+ "250030": {
268
+ "content": "he_IL",
269
+ "lstrip": true,
270
+ "normalized": false,
271
+ "rstrip": true,
272
+ "single_word": false,
273
+ "special": true
274
+ },
275
+ "250031": {
276
+ "content": "hr_HR",
277
+ "lstrip": true,
278
+ "normalized": false,
279
+ "rstrip": true,
280
+ "single_word": false,
281
+ "special": true
282
+ },
283
+ "250032": {
284
+ "content": "id_ID",
285
+ "lstrip": true,
286
+ "normalized": false,
287
+ "rstrip": true,
288
+ "single_word": false,
289
+ "special": true
290
+ },
291
+ "250033": {
292
+ "content": "ka_GE",
293
+ "lstrip": true,
294
+ "normalized": false,
295
+ "rstrip": true,
296
+ "single_word": false,
297
+ "special": true
298
+ },
299
+ "250034": {
300
+ "content": "km_KH",
301
+ "lstrip": true,
302
+ "normalized": false,
303
+ "rstrip": true,
304
+ "single_word": false,
305
+ "special": true
306
+ },
307
+ "250035": {
308
+ "content": "mk_MK",
309
+ "lstrip": true,
310
+ "normalized": false,
311
+ "rstrip": true,
312
+ "single_word": false,
313
+ "special": true
314
+ },
315
+ "250036": {
316
+ "content": "ml_IN",
317
+ "lstrip": true,
318
+ "normalized": false,
319
+ "rstrip": true,
320
+ "single_word": false,
321
+ "special": true
322
+ },
323
+ "250037": {
324
+ "content": "mn_MN",
325
+ "lstrip": true,
326
+ "normalized": false,
327
+ "rstrip": true,
328
+ "single_word": false,
329
+ "special": true
330
+ },
331
+ "250038": {
332
+ "content": "mr_IN",
333
+ "lstrip": true,
334
+ "normalized": false,
335
+ "rstrip": true,
336
+ "single_word": false,
337
+ "special": true
338
+ },
339
+ "250039": {
340
+ "content": "pl_PL",
341
+ "lstrip": true,
342
+ "normalized": false,
343
+ "rstrip": true,
344
+ "single_word": false,
345
+ "special": true
346
+ },
347
+ "250040": {
348
+ "content": "ps_AF",
349
+ "lstrip": true,
350
+ "normalized": false,
351
+ "rstrip": true,
352
+ "single_word": false,
353
+ "special": true
354
+ },
355
+ "250041": {
356
+ "content": "pt_XX",
357
+ "lstrip": true,
358
+ "normalized": false,
359
+ "rstrip": true,
360
+ "single_word": false,
361
+ "special": true
362
+ },
363
+ "250042": {
364
+ "content": "sv_SE",
365
+ "lstrip": true,
366
+ "normalized": false,
367
+ "rstrip": true,
368
+ "single_word": false,
369
+ "special": true
370
+ },
371
+ "250043": {
372
+ "content": "sw_KE",
373
+ "lstrip": true,
374
+ "normalized": false,
375
+ "rstrip": true,
376
+ "single_word": false,
377
+ "special": true
378
+ },
379
+ "250044": {
380
+ "content": "ta_IN",
381
+ "lstrip": true,
382
+ "normalized": false,
383
+ "rstrip": true,
384
+ "single_word": false,
385
+ "special": true
386
+ },
387
+ "250045": {
388
+ "content": "te_IN",
389
+ "lstrip": true,
390
+ "normalized": false,
391
+ "rstrip": true,
392
+ "single_word": false,
393
+ "special": true
394
+ },
395
+ "250046": {
396
+ "content": "th_TH",
397
+ "lstrip": true,
398
+ "normalized": false,
399
+ "rstrip": true,
400
+ "single_word": false,
401
+ "special": true
402
+ },
403
+ "250047": {
404
+ "content": "tl_XX",
405
+ "lstrip": true,
406
+ "normalized": false,
407
+ "rstrip": true,
408
+ "single_word": false,
409
+ "special": true
410
+ },
411
+ "250048": {
412
+ "content": "uk_UA",
413
+ "lstrip": true,
414
+ "normalized": false,
415
+ "rstrip": true,
416
+ "single_word": false,
417
+ "special": true
418
+ },
419
+ "250049": {
420
+ "content": "ur_PK",
421
+ "lstrip": true,
422
+ "normalized": false,
423
+ "rstrip": true,
424
+ "single_word": false,
425
+ "special": true
426
+ },
427
+ "250050": {
428
+ "content": "xh_ZA",
429
+ "lstrip": true,
430
+ "normalized": false,
431
+ "rstrip": true,
432
+ "single_word": false,
433
+ "special": true
434
+ },
435
+ "250051": {
436
+ "content": "gl_ES",
437
+ "lstrip": true,
438
+ "normalized": false,
439
+ "rstrip": true,
440
+ "single_word": false,
441
+ "special": true
442
+ },
443
+ "250052": {
444
+ "content": "sl_SI",
445
+ "lstrip": true,
446
+ "normalized": false,
447
+ "rstrip": true,
448
+ "single_word": false,
449
+ "special": true
450
+ },
451
+ "250053": {
452
+ "content": "<mask>",
453
+ "lstrip": true,
454
+ "normalized": false,
455
+ "rstrip": false,
456
+ "single_word": false,
457
+ "special": true
458
+ }
459
+ },
460
  "additional_special_tokens": [
461
  "ar_AR",
462
  "cs_CZ",
 
515
  "clean_up_tokenization_spaces": true,
516
  "cls_token": "<s>",
517
  "eos_token": "</s>",
518
+ "mask_token": "<mask>",
 
 
 
 
 
 
 
519
  "model_max_length": 1024,
520
  "pad_token": "<pad>",
521
  "sep_token": "</s>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b97f6488aa515fe6f173ab735ce4ef9098b808c2546d67579de20ac422d4ffb
3
- size 4155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff36007d320a3ebb0060c77790cf86201aa9f79b6ba9fad1093e69eaeedbec02
3
+ size 4283