Fix: upload the medium-size model instead of the small one

by Lauler - opened 9 days ago

←

Files changed (3)

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/leonardo_work/EUHPC_A01_006/experiments_whisper/stage1_results/small/",
   "activation_dropout": 0.1,
   "activation_function": "gelu",
   "apply_spec_augment": false,
@@ -10,17 +10,17 @@
   "begin_suppress_tokens": null,
   "bos_token_id": 50257,
   "classifier_proj_size": 256,
-  "d_model": 768,
-  "decoder_attention_heads": 12,
-  "decoder_ffn_dim": 3072,
   "decoder_layerdrop": 0.0,
-  "decoder_layers": 12,
   "decoder_start_token_id": 50258,
   "dropout": 0.0,
-  "encoder_attention_heads": 12,
-  "encoder_ffn_dim": 3072,
   "encoder_layerdrop": 0.0,
-  "encoder_layers": 12,
   "eos_token_id": 50257,
   "forced_decoder_ids": null,
   "init_std": 0.02,
@@ -36,7 +36,7 @@
   "max_target_positions": 448,
   "median_filter_width": 7,
   "model_type": "whisper",
-  "num_hidden_layers": 12,
   "num_mel_bins": 80,
   "pad_token_id": 50257,
   "scale_embedding": false,
@@ -47,44 +47,28 @@
   "vocab_size": 51865,
   "alignment_heads": [
     [
-      5,
-      3
     ],
     [
-      5,
-      9
-    ],
-    [
-      8,
-      0
-    ],
-    [
-      8,
       4
     ],
     [
-      8,
-      7
     ],
     [
-      8,
-      8
     ],
     [
-      9,
       0
     ],
     [
-      9,
-      7
-    ],
-    [
-      9,
-      9
-    ],
-    [
-      10,
-      5
     ]
   ],
   "lang_ids": [
@@ -282,4 +266,4 @@
     220,
     50257
   ]
-}

 {
+  "_name_or_path": "/leonardo_work/EUHPC_A01_006/experiments_whisper/stage1_results/medium_250210_124500/",
   "activation_dropout": 0.1,
   "activation_function": "gelu",
   "apply_spec_augment": false,
   "begin_suppress_tokens": null,
   "bos_token_id": 50257,
   "classifier_proj_size": 256,
+  "d_model": 1024,
+  "decoder_attention_heads": 16,
+  "decoder_ffn_dim": 4096,
   "decoder_layerdrop": 0.0,
+  "decoder_layers": 24,
   "decoder_start_token_id": 50258,
   "dropout": 0.0,
+  "encoder_attention_heads": 16,
+  "encoder_ffn_dim": 4096,
   "encoder_layerdrop": 0.0,
+  "encoder_layers": 24,
   "eos_token_id": 50257,
   "forced_decoder_ids": null,
   "init_std": 0.02,
   "max_target_positions": 448,
   "median_filter_width": 7,
   "model_type": "whisper",
+  "num_hidden_layers": 24,
   "num_mel_bins": 80,
   "pad_token_id": 50257,
   "scale_embedding": false,
   "vocab_size": 51865,
   "alignment_heads": [
     [
+      13,
+      15
     ],
     [
+      15,
       4
     ],
     [
+      15,
+      15
     ],
     [
+      16,
+      1
     ],
     [
+      20,
       0
     ],
     [
+      23,
+      4
     ]
   ],
   "lang_ids": [
     220,
     50257
   ]
+}

generation_config.json CHANGED Viewed

@@ -237,4 +237,4 @@
     "translate": 50358
   },
   "transformers_version": "4.45.2"
-}

     "translate": 50358
   },
   "transformers_version": "4.45.2"
+}

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4fe050cc61ebda02dacb2a0fd90bb5ae61300656d9339ca6107aeb53c69594da
-size 563189936

 version https://git-lfs.github.com/spec/v1
+oid sha256:f5d9eaecc00a1ca51b8f5e5f3da6270b4d234b5d3c94e1015316059a644d0320
+size 1634047376