ilyes25 committed on
Commit
83c4a75
·
verified ·
1 Parent(s): b49e67c

End of training

Browse files
Files changed (5) hide show
  1. README.md +47 -38
  2. adapter.fr.safetensors +3 -0
  3. config.json +2 -2
  4. model.safetensors +2 -2
  5. training_args.bin +1 -1
README.md CHANGED
@@ -20,10 +20,10 @@ should probably proofread and complete it, then remove this comment. -->
20
 
21
  This model is a fine-tuned version of [facebook/mms-1b-all](https://huggingface.co/facebook/mms-1b-all) on an unknown dataset.
22
  It achieves the following results on the evaluation set:
23
- - Loss: 0.3318
24
- - Wer: 0.5332
25
- - Bleu: {'bleu': 0.20626502760570276, 'precisions': [0.4828561729093584, 0.26526984126984127, 0.15708092485549133, 0.09694133377904061], 'brevity_penalty': 0.9815017376632986, 'length_ratio': 0.981670739835592, 'translation_length': 8837, 'reference_length': 9002}
26
- - Rouge: {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0}
27
 
28
  ## Model description
29
 
@@ -51,44 +51,53 @@ The following hyperparameters were used during training:
51
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
52
  - lr_scheduler_type: linear
53
  - lr_scheduler_warmup_steps: 500
54
- - num_epochs: 100
55
  - mixed_precision_training: Native AMP
56
 
57
  ### Training results
58
 
59
- | Training Loss | Epoch | Step | Validation Loss | Wer | Bleu | Rouge |
60
- |:-------------:|:-----:|:----:|:---------------:|:------:|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------:|:---------------------------------------------------------------:|
61
- | 8.9409 | 1.0 | 121 | 7.3836 | 1.0009 | {'bleu': 0.0, 'precisions': [0.0, 0.0, 0.0, 0.0], 'brevity_penalty': 0.15361828967433966, 'length_ratio': 0.3480337702732726, 'translation_length': 3133, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
62
- | 5.8951 | 2.0 | 242 | 3.9240 | 1.0 | {'bleu': 0.0, 'precisions': [0.0, 0.0, 0.0, 0.0], 'brevity_penalty': 0.00023460944616129434, 'length_ratio': 0.10686514107976006, 'translation_length': 962, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
63
- | 3.448 | 3.0 | 363 | 3.3244 | 1.0072 | {'bleu': 0.0, 'precisions': [0.00021687269572760788, 0.0, 0.0, 0.0], 'brevity_penalty': 0.38585716882722343, 'length_ratio': 0.5122195067762719, 'translation_length': 4611, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
64
- | 3.3048 | 4.0 | 484 | 3.2099 | 1.0540 | {'bleu': 0.0, 'precisions': [0.0012913223140495868, 0.0, 0.0, 0.0], 'brevity_penalty': 0.8500599971491325, 'length_ratio': 0.8602532770495446, 'translation_length': 7744, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
65
- | 1.3604 | 5.0 | 605 | 0.6633 | 0.7965 | {'bleu': 0.034929556738440316, 'precisions': [0.21936736325225534, 0.05991019884541373, 0.017828437819669734, 0.007105396717983421], 'brevity_penalty': 0.9724101311329575, 'length_ratio': 0.9727838258164853, 'translation_length': 8757, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
66
- | 0.6764 | 6.0 | 726 | 0.4717 | 0.6724 | {'bleu': 0.09414039105458619, 'precisions': [0.34541504687857305, 0.1395169578622816, 0.06105417276720351, 0.030010172939979655], 'brevity_penalty': 0.9711537088639254, 'length_ratio': 0.971561875138858, 'translation_length': 8746, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
67
- | 0.6118 | 7.0 | 847 | 0.4297 | 0.6431 | {'bleu': 0.10327123610576155, 'precisions': [0.3748719699556162, 0.1584664536741214, 0.06853899883585565, 0.03080808080808081], 'brevity_penalty': 0.9758289500370382, 'length_ratio': 0.9761164185736503, 'translation_length': 8787, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
68
- | 0.5499 | 8.0 | 968 | 0.4136 | 0.6383 | {'bleu': 0.09547633908306723, 'precisions': [0.37913718329148594, 0.15538461538461537, 0.06206191588785047, 0.0253592561284869], 'brevity_penalty': 0.9729807252327849, 'length_ratio': 0.9733392579426794, 'translation_length': 8762, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
69
- | 0.5426 | 9.0 | 1089 | 0.3948 | 0.6236 | {'bleu': 0.1146211663681401, 'precisions': [0.3941814033086138, 0.1719851339228502, 0.07882061012990804, 0.03599188915174045], 'brevity_penalty': 0.973322929713784, 'length_ratio': 0.9736725172183959, 'translation_length': 8765, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
70
- | 0.5224 | 10.0 | 1210 | 0.3845 | 0.6133 | {'bleu': 0.14615786010373802, 'precisions': [0.4039206747207659, 0.19687660010240654, 0.10451895043731778, 0.060917988525143435], 'brevity_penalty': 0.9743488596571711, 'length_ratio': 0.9746722950455454, 'translation_length': 8774, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
71
- | 0.5106 | 11.0 | 1331 | 0.3768 | 0.6081 | {'bleu': 0.14761534429663833, 'precisions': [0.4103973434100538, 0.2001029468536868, 0.10602727672679278, 0.0616822429906542], 'brevity_penalty': 0.969666867156736, 'length_ratio': 0.9701177516107532, 'translation_length': 8733, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
72
- | 0.4808 | 12.0 | 1452 | 0.3689 | 0.6038 | {'bleu': 0.14419001572294796, 'precisions': [0.4128158433872069, 0.20002556237218813, 0.10203784570596798, 0.05660377358490566], 'brevity_penalty': 0.9757151727531809, 'length_ratio': 0.9760053321484115, 'translation_length': 8786, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
73
- | 0.4887 | 13.0 | 1573 | 0.3645 | 0.5959 | {'bleu': 0.14552105797325302, 'precisions': [0.4212262541235354, 0.20283561118916849, 0.10340314136125654, 0.0558734432850892], 'brevity_penalty': 0.9762839328773337, 'length_ratio': 0.9765607642746057, 'translation_length': 8791, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
74
- | 0.4868 | 14.0 | 1694 | 0.3618 | 0.5964 | {'bleu': 0.14398457640279802, 'precisions': [0.4209029910155806, 0.20061294853786235, 0.10206455364931666, 0.05484522207267833], 'brevity_penalty': 0.9765113485390307, 'length_ratio': 0.9767829371250834, 'translation_length': 8793, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
75
- | 0.4694 | 15.0 | 1815 | 0.3552 | 0.5896 | {'bleu': 0.1407651620422715, 'precisions': [0.42652899126290705, 0.20315883326964718, 0.1007830626450116, 0.04898506961919141], 'brevity_penalty': 0.978782729886213, 'length_ratio': 0.97900466562986, 'translation_length': 8813, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
76
- | 0.4717 | 16.0 | 1936 | 0.3515 | 0.5820 | {'bleu': 0.14704090054592955, 'precisions': [0.4347430650295589, 0.21087567015573142, 0.10566860465116279, 0.05299461641991925], 'brevity_penalty': 0.9768523773634661, 'length_ratio': 0.9771161964007998, 'translation_length': 8796, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
77
- | 0.4697 | 17.0 | 2057 | 0.3472 | 0.5820 | {'bleu': 0.16519675176223306, 'precisions': [0.4347628256171084, 0.221356495082386, 0.12045388420133837, 0.0707189762586294], 'brevity_penalty': 0.9762839328773337, 'length_ratio': 0.9765607642746057, 'translation_length': 8791, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
78
- | 0.4495 | 18.0 | 2178 | 0.3440 | 0.5790 | {'bleu': 0.16684635490186076, 'precisions': [0.4380551127305853, 0.22327365728900256, 0.12163146394756008, 0.07200674536256324], 'brevity_penalty': 0.9752599372827168, 'length_ratio': 0.9755609864474561, 'translation_length': 8782, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
79
- | 0.4415 | 19.0 | 2299 | 0.3415 | 0.5724 | {'bleu': 0.162083792001847, 'precisions': [0.4451789377706861, 0.22375832053251407, 0.11798162461717952, 0.06515867656988521], 'brevity_penalty': 0.9743488596571711, 'length_ratio': 0.9746722950455454, 'translation_length': 8774, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
80
- | 0.4418 | 20.0 | 2420 | 0.3407 | 0.5635 | {'bleu': 0.1651392945199903, 'precisions': [0.45348043676069155, 0.22924648786717752, 0.12087272727272727, 0.06511862695608278], 'brevity_penalty': 0.9763976470202772, 'length_ratio': 0.9766718506998445, 'translation_length': 8792, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
81
- | 0.4411 | 21.0 | 2541 | 0.3380 | 0.5612 | {'bleu': 0.17032448446358872, 'precisions': [0.4554837246228876, 0.2328453214513049, 0.12492753623188406, 0.06908115358819585], 'brevity_penalty': 0.9792364011971344, 'length_ratio': 0.9794490113308154, 'translation_length': 8817, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
82
- | 0.4368 | 22.0 | 2662 | 0.3403 | 0.5563 | {'bleu': 0.17429463351579735, 'precisions': [0.46019505556815604, 0.2389256619144603, 0.12896681640341978, 0.07074601844090528], 'brevity_penalty': 0.9793497875444289, 'length_ratio': 0.9795600977560542, 'translation_length': 8818, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
83
- | 0.4322 | 23.0 | 2783 | 0.3307 | 0.5598 | {'bleu': 0.18466486831726667, 'precisions': [0.4570876435148346, 0.24365028717294193, 0.1379360465116279, 0.08309503784693019], 'brevity_penalty': 0.9769660283987757, 'length_ratio': 0.9772272828260387, 'translation_length': 8797, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
84
- | 0.4263 | 24.0 | 2904 | 0.3398 | 0.5549 | {'bleu': 0.1797281293297898, 'precisions': [0.46188799272975123, 0.2423160311184798, 0.13404008132442638, 0.07613445378151261], 'brevity_penalty': 0.9776476696891355, 'length_ratio': 0.9778938013774717, 'translation_length': 8803, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
85
- | 0.4102 | 25.0 | 3025 | 0.3253 | 0.5472 | {'bleu': 0.19095303691786358, 'precisions': [0.469932931681255, 0.25488194001276326, 0.14375, 0.08476286579212916], 'brevity_penalty': 0.9769660283987757, 'length_ratio': 0.9772272828260387, 'translation_length': 8797, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
86
- | 0.4236 | 26.0 | 3146 | 0.3274 | 0.5474 | {'bleu': 0.18409612160683292, 'precisions': [0.4694085656016315, 0.2483468972533062, 0.13677811550151975, 0.07801774652603381], 'brevity_penalty': 0.9802564252131077, 'length_ratio': 0.9804487891579649, 'translation_length': 8826, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
87
- | 0.4177 | 27.0 | 3267 | 0.3255 | 0.5419 | {'bleu': 0.19152955171945296, 'precisions': [0.47450135992747056, 0.25489697278046297, 0.14405675401766324, 0.08372404554588078], 'brevity_penalty': 0.980029841295489, 'length_ratio': 0.9802266163074872, 'translation_length': 8824, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
88
- | 0.4051 | 28.0 | 3388 | 0.3218 | 0.5380 | {'bleu': 0.20391771010111173, 'precisions': [0.47922814982973894, 0.2658002038735984, 0.1550848687073843, 0.09550184625713326], 'brevity_penalty': 0.9784423441477751, 'length_ratio': 0.9786714063541435, 'translation_length': 8810, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
89
- | 0.3993 | 29.0 | 3509 | 0.3225 | 0.5364 | {'bleu': 0.1991760083321937, 'precisions': [0.4802765812740875, 0.26145038167938933, 0.15090514120202753, 0.09011725293132328], 'brevity_penalty': 0.9798032070519724, 'length_ratio': 0.9800044434570095, 'translation_length': 8822, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
90
- | 0.3942 | 30.0 | 3630 | 0.3230 | 0.5335 | {'bleu': 0.20119532062721326, 'precisions': [0.48279375141498754, 0.2630843495934959, 0.15223362729507012, 0.09144098963557339], 'brevity_penalty': 0.981162257838828, 'length_ratio': 0.9813374805598756, 'translation_length': 8834, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
91
- | 0.3846 | 31.0 | 3751 | 0.3318 | 0.5332 | {'bleu': 0.20626502760570276, 'precisions': [0.4828561729093584, 0.26526984126984127, 0.15708092485549133, 0.09694133377904061], 'brevity_penalty': 0.9815017376632986, 'length_ratio': 0.981670739835592, 'translation_length': 8837, 'reference_length': 9002} | {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0} |
 
 
 
 
 
 
 
 
 
92
 
93
 
94
  ### Framework versions
 
20
 
21
  This model is a fine-tuned version of [facebook/mms-1b-all](https://huggingface.co/facebook/mms-1b-all) on an unknown dataset.
22
  It achieves the following results on the evaluation set:
23
+ - Loss: 0.1983
24
+ - Wer: 0.1456
25
+ - Bleu: {'bleu': 0.7492044741492486, 'precisions': [0.8730063030967389, 0.7883760255527025, 0.7152661166678835, 0.6510430304617264], 'brevity_penalty': 0.9957339815437508, 'length_ratio': 0.995743055176554, 'translation_length': 18245, 'reference_length': 18323}
26
+ - Rouge: {'rouge1': 0.8748364322650914, 'rouge2': 0.7928723605220098, 'rougeL': 0.8745015805780032, 'rougeLsum': 0.8743113489400196}
27
 
28
  ## Model description
29
 
 
51
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
52
  - lr_scheduler_type: linear
53
  - lr_scheduler_warmup_steps: 500
54
+ - num_epochs: 40
55
  - mixed_precision_training: Native AMP
56
 
57
  ### Training results
58
 
59
+ | Training Loss | Epoch | Step | Validation Loss | Wer | Bleu | Rouge |
60
+ |:-------------:|:-------:|:-----:|:---------------:|:------:|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------:|:---------------------------------------------------------------------------------------------------------------------------:|
61
+ | 5.9588 | 1.0 | 285 | 2.7873 | 0.9827 | {'bleu': 0.0, 'precisions': [0.059154929577464786, 0.0, 0.0, 0.0], 'brevity_penalty': 0.11433624320676729, 'length_ratio': 0.3155956311912624, 'translation_length': 2485, 'reference_length': 7874} | {'rouge1': 0.03875997597517414, 'rouge2': 0.0, 'rougeL': 0.03892048827301332, 'rougeLsum': 0.038793322006122906} |
62
+ | 0.4602 | 2.0 | 570 | 0.3555 | 0.2311 | {'bleu': 0.6283054199052752, 'precisions': [0.7993283417749394, 0.6805363212891854, 0.5854142185663925, 0.5068155835018908], 'brevity_penalty': 0.9912846225149247, 'length_ratio': 0.9913223817060525, 'translation_length': 18164, 'reference_length': 18323} | {'rouge1': 0.7917720369498722, 'rouge2': 0.6755927340957304, 'rougeL': 0.7912377266650397, 'rougeLsum': 0.7913035186420103} |
63
+ | 0.3842 | 3.0 | 855 | 0.3058 | 0.2090 | {'bleu': 0.6605337548855493, 'precisions': [0.8175150519978106, 0.7074787393696849, 0.616208731142045, 0.5403591352859135], 'brevity_penalty': 0.99710327314591, 'length_ratio': 0.9971074605686842, 'translation_length': 18270, 'reference_length': 18323} | {'rouge1': 0.8146357732958056, 'rouge2': 0.7071194587560558, 'rougeL': 0.814052758845498, 'rougeLsum': 0.8138241815295024} |
64
+ | 0.3719 | 4.0 | 1140 | 0.2868 | 0.2010 | {'bleu': 0.6712219662583173, 'precisions': [0.8250068549492734, 0.7188067932568779, 0.6293752283522105, 0.5544580419580419], 'brevity_penalty': 0.9951857415819062, 'length_ratio': 0.9951972930197021, 'translation_length': 18235, 'reference_length': 18323} | {'rouge1': 0.8222029713967768, 'rouge2': 0.7197657000623603, 'rougeL': 0.8217923739918656, 'rougeLsum': 0.821719465931791} |
65
+ | 0.3336 | 5.0 | 1425 | 0.2742 | 0.1959 | {'bleu': 0.6785372107003715, 'precisions': [0.8300621254604431, 0.7259128904531457, 0.6393695014662757, 0.5666900666900667], 'brevity_penalty': 0.9926599804903764, 'length_ratio': 0.9926867870981826, 'translation_length': 18189, 'reference_length': 18323} | {'rouge1': 0.8265645999560629, 'rouge2': 0.7247965384723267, 'rougeL': 0.8259582425920233, 'rougeLsum': 0.8259017198295564} |
66
+ | 0.3442 | 6.0 | 1710 | 0.2642 | 0.1903 | {'bleu': 0.6873788245362181, 'precisions': [0.832968476357268, 0.7314617981743153, 0.6461886022445708, 0.5733948950256991], 'brevity_penalty': 0.9972127357870568, 'length_ratio': 0.9972166130000546, 'translation_length': 18272, 'reference_length': 18323} | {'rouge1': 0.8325100938158259, 'rouge2': 0.7340864170622121, 'rougeL': 0.83191579042451, 'rougeLsum': 0.8318541463934617} |
67
+ | 0.3341 | 7.0 | 1995 | 0.2582 | 0.1843 | {'bleu': 0.6963666431657629, 'precisions': [0.839673317254988, 0.7409495177251659, 0.6574662285505659, 0.5849270806043141], 'brevity_penalty': 0.9956791710107048, 'length_ratio': 0.9956884789608689, 'translation_length': 18244, 'reference_length': 18323} | {'rouge1': 0.838537901118194, 'rouge2': 0.7427526814996277, 'rougeL': 0.8379557459558569, 'rougeLsum': 0.8379007055417265} |
68
+ | 0.3172 | 8.0 | 2280 | 0.2494 | 0.1804 | {'bleu': 0.7001144932835086, 'precisions': [0.843205001645278, 0.7451742291301078, 0.6613327487943884, 0.5895822408669813], 'brevity_penalty': 0.9951309011278089, 'length_ratio': 0.9951427168040168, 'translation_length': 18234, 'reference_length': 18323} | {'rouge1': 0.8428458068475617, 'rouge2': 0.7473487117700717, 'rougeL': 0.8422200154587571, 'rougeLsum': 0.8420994714247132} |
69
+ | 0.294 | 9.0 | 2565 | 0.2444 | 0.1784 | {'bleu': 0.7015679264162828, 'precisions': [0.8458917284968398, 0.7474398441917447, 0.6644683813292299, 0.5931088900578643], 'brevity_penalty': 0.9929897872850882, 'length_ratio': 0.9930142443922938, 'translation_length': 18195, 'reference_length': 18323} | {'rouge1': 0.8447332085359476, 'rouge2': 0.7490673320409132, 'rougeL': 0.8441531451631874, 'rougeLsum': 0.843987486458086} |
70
+ | 0.2927 | 10.0 | 2850 | 0.2395 | 0.1734 | {'bleu': 0.7094676103718882, 'precisions': [0.8488569705608245, 0.7529912923635909, 0.6714379610019718, 0.6010480349344978], 'brevity_penalty': 0.9955147214626567, 'length_ratio': 0.9955247503138133, 'translation_length': 18241, 'reference_length': 18323} | {'rouge1': 0.8488302350839227, 'rouge2': 0.7554473763418516, 'rougeL': 0.848226337259566, 'rougeLsum': 0.8481517731134592} |
71
+ | 0.2974 | 11.0 | 3135 | 0.2361 | 0.1757 | {'bleu': 0.7073575226963291, 'precisions': [0.8489256198347107, 0.7540322580645161, 0.6735038964858109, 0.6032737833318665], 'brevity_penalty': 0.9905136020383278, 'length_ratio': 0.9905583146864596, 'translation_length': 18150, 'reference_length': 18323} | {'rouge1': 0.8469188343317979, 'rouge2': 0.753826185237243, 'rougeL': 0.8462106498895938, 'rougeLsum': 0.8462690600047347} |
72
+ | 0.2929 | 12.0 | 3420 | 0.2323 | 0.1710 | {'bleu': 0.7104887814499381, 'precisions': [0.8529363110008271, 0.7578987198082866, 0.6768970339294914, 0.6069980609906575], 'brevity_penalty': 0.9896868547353578, 'length_ratio': 0.9897396714511816, 'translation_length': 18135, 'reference_length': 18323} | {'rouge1': 0.851535800343566, 'rouge2': 0.7594371464363054, 'rougeL': 0.8507125679902645, 'rougeLsum': 0.8505546552290876} |
73
+ | 0.2922 | 13.0 | 3705 | 0.2277 | 0.1690 | {'bleu': 0.7147023714998528, 'precisions': [0.8544513001322168, 0.7611188106337408, 0.6811967068509261, 0.6115804294262583], 'brevity_penalty': 0.9906237838889417, 'length_ratio': 0.99066746711783, 'translation_length': 18152, 'reference_length': 18323} | {'rouge1': 0.8532183741925291, 'rouge2': 0.7629739149453718, 'rougeL': 0.8526967418105296, 'rougeLsum': 0.8525344290554377} |
74
+ | 0.2723 | 14.0 | 3990 | 0.2255 | 0.1665 | {'bleu': 0.7185286342228578, 'precisions': [0.8572294801830108, 0.7651768265775705, 0.6859412933127345, 0.6166784078901022], 'brevity_penalty': 0.9900176348680043, 'length_ratio': 0.9900671287452928, 'translation_length': 18141, 'reference_length': 18323} | {'rouge1': 0.8554844372155834, 'rouge2': 0.7665585766259185, 'rougeL': 0.8550678894072193, 'rougeLsum': 0.8549249072117735} |
75
+ | 0.2618 | 15.0 | 4275 | 0.2216 | 0.1647 | {'bleu': 0.7205920025415866, 'precisions': [0.8575904144223371, 0.7653304850464941, 0.6855488787923201, 0.6164635749978084], 'brevity_penalty': 0.9929348269851479, 'length_ratio': 0.9929596681766086, 'translation_length': 18194, 'reference_length': 18323} | {'rouge1': 0.8572991962911986, 'rouge2': 0.7687939439030189, 'rougeL': 0.8569135698404339, 'rougeLsum': 0.8567069159809071} |
76
+ | 0.2824 | 16.0 | 4560 | 0.2194 | 0.1625 | {'bleu': 0.7248245517316763, 'precisions': [0.859585463741822, 0.7690277166739992, 0.6911516750971336, 0.6221929824561403], 'brevity_penalty': 0.9926599804903764, 'length_ratio': 0.9926867870981826, 'translation_length': 18189, 'reference_length': 18323} | {'rouge1': 0.860740052677103, 'rouge2': 0.7738344427906813, 'rougeL': 0.8602549832284943, 'rougeLsum': 0.8601224055557424} |
77
+ | 0.2584 | 17.0 | 4845 | 0.2184 | 0.1624 | {'bleu': 0.7233957743502292, 'precisions': [0.8591843464878531, 0.7673410404624278, 0.689066393082222, 0.6201332865661171], 'brevity_penalty': 0.9929348269851479, 'length_ratio': 0.9929596681766086, 'translation_length': 18194, 'reference_length': 18323} | {'rouge1': 0.8596520621812659, 'rouge2': 0.7716232895345339, 'rougeL': 0.8592810276384565, 'rougeLsum': 0.85911704018123} |
78
+ | 0.2626 | 18.0 | 5130 | 0.2162 | 0.1575 | {'bleu': 0.7321328546559496, 'precisions': [0.8624205218153914, 0.7733308280095202, 0.6966267523364486, 0.6292125021826436], 'brevity_penalty': 0.9956791710107048, 'length_ratio': 0.9956884789608689, 'translation_length': 18244, 'reference_length': 18323} | {'rouge1': 0.8630838420026828, 'rouge2': 0.7773667756363078, 'rougeL': 0.8628126973557786, 'rougeLsum': 0.8627419660979692} |
79
+ | 0.2518 | 19.0 | 5415 | 0.2132 | 0.1577 | {'bleu': 0.7305988372304458, 'precisions': [0.8624547548535703, 0.7728127350213086, 0.6953821423352331, 0.6268461067901774], 'brevity_penalty': 0.9951309011278089, 'length_ratio': 0.9951427168040168, 'translation_length': 18234, 'reference_length': 18323} | {'rouge1': 0.8638253584058928, 'rouge2': 0.7773261199114829, 'rougeL': 0.8632427380502744, 'rougeLsum': 0.8631565081641605} |
80
+ | 0.2624 | 20.0 | 5700 | 0.2114 | 0.1561 | {'bleu': 0.7336678313741997, 'precisions': [0.8624801706690006, 0.7734799725051553, 0.6966431224058837, 0.6291880602210426], 'brevity_penalty': 0.9977051698422599, 'length_ratio': 0.9977077989412214, 'translation_length': 18281, 'reference_length': 18323} | {'rouge1': 0.8643711864157274, 'rouge2': 0.7789576656096648, 'rougeL': 0.864045843841154, 'rougeLsum': 0.8639432546192249} |
81
+ | 0.274 | 21.0 | 5985 | 0.2125 | 0.1572 | {'bleu': 0.7327413298256028, 'precisions': [0.8631249656989188, 0.7743210186288654, 0.6986762232136327, 0.6313303594856993], 'brevity_penalty': 0.9944177028031576, 'length_ratio': 0.9944332260001092, 'translation_length': 18221, 'reference_length': 18323} | {'rouge1': 0.8637561560608497, 'rouge2': 0.7775626243197682, 'rougeL': 0.8633528770604967, 'rougeLsum': 0.8632085396165139} |
82
+ | 0.2484 | 22.0 | 6270 | 0.2091 | 0.1552 | {'bleu': 0.7357839881765593, 'precisions': [0.8648885962023927, 0.7774711490215755, 0.7019160450489981, 0.634892872759073], 'brevity_penalty': 0.9944725821787992, 'length_ratio': 0.9944878022157944, 'translation_length': 18222, 'reference_length': 18323} | {'rouge1': 0.8659727708387619, 'rouge2': 0.7816164515395694, 'rougeL': 0.8657951715895931, 'rougeLsum': 0.8655840959367318} |
83
+ | 0.2473 | 23.0 | 6555 | 0.2090 | 0.1554 | {'bleu': 0.7356730614040227, 'precisions': [0.8642543859649123, 0.7763438165643403, 0.7012123867952089, 0.6340143181421337], 'brevity_penalty': 0.9954598989631315, 'length_ratio': 0.995470174098128, 'translation_length': 18240, 'reference_length': 18323} | {'rouge1': 0.865456270958754, 'rouge2': 0.7804951440612873, 'rougeL': 0.8652647943705735, 'rougeLsum': 0.8649670956520807} |
84
+ | 0.2418 | 24.0 | 6840 | 0.2055 | 0.1553 | {'bleu': 0.7347926831245415, 'precisions': [0.8653296703296703, 0.7771008667252858, 0.7016554351010841, 0.634770417104802], 'brevity_penalty': 0.9932645437985937, 'length_ratio': 0.9932871254707198, 'translation_length': 18200, 'reference_length': 18323} | {'rouge1': 0.8654752140097928, 'rouge2': 0.7807218611868961, 'rougeL': 0.8652326088546789, 'rougeLsum': 0.8650739915057691} |
85
+ | 0.2577 | 25.0 | 7125 | 0.2040 | 0.1515 | {'bleu': 0.7395907984479824, 'precisions': [0.8676938260774207, 0.7802005012531328, 0.7051132213294375, 0.6386026200873363], 'brevity_penalty': 0.9953502449878465, 'length_ratio': 0.9953610216667577, 'translation_length': 18238, 'reference_length': 18323} | {'rouge1': 0.8685153389774867, 'rouge2': 0.7838568977155047, 'rougeL': 0.8683321242058704, 'rougeLsum': 0.8680531173155077} |
86
+ | 0.2478 | 26.0 | 7410 | 0.2035 | 0.1523 | {'bleu': 0.7389574395410246, 'precisions': [0.8673581385138843, 0.7797917711991972, 0.7048413046657891, 0.639496239286339], 'brevity_penalty': 0.9944725821787992, 'length_ratio': 0.9944878022157944, 'translation_length': 18222, 'reference_length': 18323} | {'rouge1': 0.8684026564775361, 'rouge2': 0.7837147217327451, 'rougeL': 0.8680473992168228, 'rougeLsum': 0.86781442567829} |
87
+ | 0.2345 | 27.0 | 7695 | 0.2036 | 0.1525 | {'bleu': 0.7394120868432645, 'precisions': [0.8659697898423818, 0.7782293360010004, 0.7032206353832702, 0.6378124183575721], 'brevity_penalty': 0.9972127357870568, 'length_ratio': 0.9972166130000546, 'translation_length': 18272, 'reference_length': 18323} | {'rouge1': 0.8680049443409963, 'rouge2': 0.7830505254725744, 'rougeL': 0.8677384137559521, 'rougeLsum': 0.8675358853961506} |
88
+ | 0.2398 | 28.0 | 7980 | 0.2025 | 0.1513 | {'bleu': 0.7410617179914926, 'precisions': [0.8681987713909609, 0.7813087626927416, 0.7069570301081555, 0.6415836392239119], 'brevity_penalty': 0.9950212112404683, 'length_ratio': 0.9950335643726465, 'translation_length': 18232, 'reference_length': 18323} | {'rouge1': 0.8691516758267378, 'rouge2': 0.7855889417660622, 'rougeL': 0.8688010484175208, 'rougeLsum': 0.8685495828117757} |
89
+ | 0.2595 | 29.0 | 8265 | 0.2005 | 0.1506 | {'bleu': 0.7408702837830967, 'precisions': [0.8690567695179532, 0.7818775100401606, 0.7071564466559345, 0.6421881838074398], 'brevity_penalty': 0.9940334633019136, 'length_ratio': 0.9940511924903127, 'translation_length': 18214, 'reference_length': 18323} | {'rouge1': 0.8705678413238229, 'rouge2': 0.7865174894976992, 'rougeL': 0.8703173243712404, 'rougeLsum': 0.8700254528394962} |
90
+ | 0.224 | 30.0 | 8550 | 0.2009 | 0.1487 | {'bleu': 0.7450849356742056, 'precisions': [0.8704333516182118, 0.7844784353059178, 0.7112995176143838, 0.6476140534871526], 'brevity_penalty': 0.9949115093798545, 'length_ratio': 0.994924411941276, 'translation_length': 18230, 'reference_length': 18323} | {'rouge1': 0.8713511668656566, 'rouge2': 0.7878011114559871, 'rougeL': 0.8710130200505186, 'rougeLsum': 0.8707877973869348} |
91
+ | 0.2218 | 31.0 | 8835 | 0.2005 | 0.1492 | {'bleu': 0.7446394749315683, 'precisions': [0.8707180500658761, 0.7851047810264776, 0.7116622768510389, 0.6470073503675183], 'brevity_penalty': 0.9941432609952691, 'length_ratio': 0.9941603449216831, 'translation_length': 18216, 'reference_length': 18323} | {'rouge1': 0.871600980620826, 'rouge2': 0.7896333858185615, 'rougeL': 0.8713249999389157, 'rougeLsum': 0.8710035822779216} |
92
+ | 0.2249 | 32.0 | 9120 | 0.2002 | 0.1496 | {'bleu': 0.7428408162780507, 'precisions': [0.8707584007039543, 0.7850361521534108, 0.7109644297763109, 0.646134947793279], 'brevity_penalty': 0.9923300656862052, 'length_ratio': 0.9923593298040714, 'translation_length': 18183, 'reference_length': 18323} | {'rouge1': 0.871521799540266, 'rouge2': 0.7886835586110674, 'rougeL': 0.8711811073148175, 'rougeLsum': 0.8711031407486098} |
93
+ | 0.2258 | 33.0 | 9405 | 0.2008 | 0.1489 | {'bleu': 0.7436253569604943, 'precisions': [0.8706385780118499, 0.7836990595611285, 0.7097222222222223, 0.6447552447552447], 'brevity_penalty': 0.9948017955446742, 'length_ratio': 0.9948152595099056, 'translation_length': 18228, 'reference_length': 18323} | {'rouge1': 0.8721419286921401, 'rouge2': 0.7882963455000708, 'rougeL': 0.8717333624704182, 'rougeLsum': 0.8716064100420517} |
94
+ | 0.2301 | 34.0 | 9690 | 0.1997 | 0.1469 | {'bleu': 0.7477380046910622, 'precisions': [0.871839868384974, 0.78724070940653, 0.7143274640169504, 0.6500393116100288], 'brevity_penalty': 0.9951857415819062, 'length_ratio': 0.9951972930197021, 'translation_length': 18235, 'reference_length': 18323} | {'rouge1': 0.8733291718803134, 'rouge2': 0.7912828262461826, 'rougeL': 0.8730615834810505, 'rougeLsum': 0.8729508479014352} |
95
+ | 0.2352 | 35.0 | 9975 | 0.1989 | 0.1474 | {'bleu': 0.746786327866007, 'precisions': [0.8721523851347642, 0.7870004391743523, 0.7138049601287585, 0.6497506343512118], 'brevity_penalty': 0.9941981553480093, 'length_ratio': 0.9942149211373683, 'translation_length': 18217, 'reference_length': 18323} | {'rouge1': 0.873008906192879, 'rouge2': 0.790428630395299, 'rougeL': 0.8727160101378854, 'rougeLsum': 0.872513685033558} |
96
+ | 0.2368 | 36.0 | 10260 | 0.1987 | 0.1481 | {'bleu': 0.7450258680082317, 'precisions': [0.8723720418271876, 0.7871255977850491, 0.7142123036264866, 0.6497408416059035], 'brevity_penalty': 0.9916148795787761, 'length_ratio': 0.9916498390001637, 'translation_length': 18170, 'reference_length': 18323} | {'rouge1': 0.872557108952186, 'rouge2': 0.7899616699266603, 'rougeL': 0.8723067110327652, 'rougeLsum': 0.8722357990611533} |
97
+ | 0.2387 | 37.0 | 10545 | 0.1987 | 0.1472 | {'bleu': 0.7461895367214819, 'precisions': [0.871914426769062, 0.7861083249749248, 0.7125420260195878, 0.6478762454116413], 'brevity_penalty': 0.9949115093798545, 'length_ratio': 0.994924411941276, 'translation_length': 18230, 'reference_length': 18323} | {'rouge1': 0.8734065376381056, 'rouge2': 0.7908717014566278, 'rougeL': 0.8730576045837826, 'rougeLsum': 0.8729880391818262} |
98
+ | 0.2198 | 38.0 | 10830 | 0.1984 | 0.1460 | {'bleu': 0.7480290753832786, 'precisions': [0.8731273665148439, 0.7880840388836626, 0.7149542961608775, 0.6505465675557499], 'brevity_penalty': 0.9945274585595061, 'length_ratio': 0.9945423784314795, 'translation_length': 18223, 'reference_length': 18323} | {'rouge1': 0.8746790367634547, 'rouge2': 0.7924947185694857, 'rougeL': 0.8743742574864739, 'rougeLsum': 0.8741497830000428} |
99
+ | 0.2261 | 39.0 | 11115 | 0.1981 | 0.1461 | {'bleu': 0.7482856703011707, 'precisions': [0.8729975861312267, 0.7880877742946708, 0.7149853801169591, 0.6507867132867133], 'brevity_penalty': 0.9948017955446742, 'length_ratio': 0.9948152595099056, 'translation_length': 18228, 'reference_length': 18323} | {'rouge1': 0.8746130363164816, 'rouge2': 0.7924162570451201, 'rougeL': 0.8742493430241225, 'rougeLsum': 0.8740282212067312} |
100
+ | 0.2274 | 39.8604 | 11360 | 0.1983 | 0.1456 | {'bleu': 0.7492044741492486, 'precisions': [0.8730063030967389, 0.7883760255527025, 0.7152661166678835, 0.6510430304617264], 'brevity_penalty': 0.9957339815437508, 'length_ratio': 0.995743055176554, 'translation_length': 18245, 'reference_length': 18323} | {'rouge1': 0.8748364322650914, 'rouge2': 0.7928723605220098, 'rougeL': 0.8745015805780032, 'rougeLsum': 0.8743113489400196} |
101
 
102
 
103
  ### Framework versions
adapter.fr.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43d625a76d3bf29c50b42f05480ec25e6428d16b01ada841324577f8e74b0cab
3
+ size 8870276
config.json CHANGED
@@ -77,7 +77,7 @@
77
  "num_hidden_layers": 48,
78
  "num_negatives": 100,
79
  "output_hidden_size": 1280,
80
- "pad_token_id": 55,
81
  "proj_codevector_dim": 1024,
82
  "tdnn_dilation": [
83
  1,
@@ -103,6 +103,6 @@
103
  "torch_dtype": "float32",
104
  "transformers_version": "4.49.0",
105
  "use_weighted_layer_sum": false,
106
- "vocab_size": 58,
107
  "xvector_output_dim": 512
108
  }
 
77
  "num_hidden_layers": 48,
78
  "num_negatives": 100,
79
  "output_hidden_size": 1280,
80
+ "pad_token_id": 42,
81
  "proj_codevector_dim": 1024,
82
  "tdnn_dilation": [
83
  1,
 
103
  "torch_dtype": "float32",
104
  "transformers_version": "4.49.0",
105
  "use_weighted_layer_sum": false,
106
+ "vocab_size": 45,
107
  "xvector_output_dim": 512
108
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f480f95da2d14aacc99955561a1be43fa28819b1b11fff4e4779875d42a11cf3
3
- size 3859029272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fe80b3603bbec60a90f3b430052b011f01a2bee96eeb45c79b9171a42453f39
3
+ size 3858962660
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2c4357cc770c91cd000a5f54167afc9f8befa84bb10ca226680d0b0ce2e4830
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8459abaa8973435028a440c432b0587c88a97983c820ee22fa6d8fe97848a0fb
3
  size 5368