jihong008
/

musicgen-melody-lora-punk-colab

PEFT

Safetensors

Generated from Trainer

Model card · Files and versions · Community

jihong008 committed on Jun 10, 2024

Commit

fa647a1

verified ·

1 Parent(s): 4df7963

End of training

Browse files

Files changed (2) hide show

README.md +3 -1
trainer_state.json +19 -103

README.md CHANGED Viewed

@@ -2,6 +2,8 @@
 license: cc-by-nc-4.0
 library_name: peft
 tags:
 - generated_from_trainer
 base_model: facebook/musicgen-melody
 model-index:
@@ -14,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
 # musicgen-melody-lora-punk-colab
-This model is a fine-tuned version of [facebook/musicgen-melody](https://huggingface.co/facebook/musicgen-melody) on the None dataset.
 ## Model description

 license: cc-by-nc-4.0
 library_name: peft
 tags:
+- text-to-audio
+- tiny-punk
 - generated_from_trainer
 base_model: facebook/musicgen-melody
 model-index:
 # musicgen-melody-lora-punk-colab
+This model is a fine-tuned version of [facebook/musicgen-melody](https://huggingface.co/facebook/musicgen-melody) on the ylacombe/tiny-punk dataset.
 ## Model description

trainer_state.json CHANGED Viewed

@@ -1,123 +1,39 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.6721311475409837,
   "eval_steps": 500,
-  "global_step": 28,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.26229508196721313,
-      "grad_norm": 1.3779234886169434,
-      "learning_rate": 0.00018571428571428572,
-      "loss": 9.4061,
-      "step": 2
-    },
-    {
-      "epoch": 0.5245901639344263,
-      "grad_norm": 2.1614365577697754,
-      "learning_rate": 0.00017142857142857143,
-      "loss": 8.9057,
-      "step": 4
-    },
-    {
-      "epoch": 0.7868852459016393,
-      "grad_norm": 2.2431693077087402,
-      "learning_rate": 0.00015714285714285716,
-      "loss": 8.3094,
-      "step": 6
-    },
-    {
-      "epoch": 1.0491803278688525,
-      "grad_norm": 2.040867567062378,
-      "learning_rate": 0.00014285714285714287,
-      "loss": 7.8253,
-      "step": 8
-    },
-    {
-      "epoch": 1.3114754098360657,
-      "grad_norm": 1.7131154537200928,
-      "learning_rate": 0.00012857142857142858,
-      "loss": 7.2788,
-      "step": 10
-    },
-    {
-      "epoch": 1.5737704918032787,
-      "grad_norm": 2.2424774169921875,
-      "learning_rate": 0.00011428571428571428,
-      "loss": 7.4106,
-      "step": 12
-    },
-    {
-      "epoch": 1.8360655737704918,
-      "grad_norm": 1.3827060461044312,
       "learning_rate": 0.0001,
-      "loss": 7.1381,
-      "step": 14
-    },
-    {
-      "epoch": 2.098360655737705,
-      "grad_norm": 1.5854527950286865,
-      "learning_rate": 8.571428571428571e-05,
-      "loss": 6.73,
-      "step": 16
-    },
-    {
-      "epoch": 2.360655737704918,
-      "grad_norm": 1.3298927545547485,
-      "learning_rate": 7.142857142857143e-05,
-      "loss": 6.9203,
-      "step": 18
-    },
-    {
-      "epoch": 2.6229508196721314,
-      "grad_norm": 1.2383928298950195,
-      "learning_rate": 5.714285714285714e-05,
-      "loss": 6.7813,
-      "step": 20
-    },
-    {
-      "epoch": 2.8852459016393444,
-      "grad_norm": 0.7927147746086121,
-      "learning_rate": 4.2857142857142856e-05,
-      "loss": 6.8375,
-      "step": 22
-    },
-    {
-      "epoch": 3.1475409836065573,
-      "grad_norm": 1.323878288269043,
-      "learning_rate": 2.857142857142857e-05,
-      "loss": 6.5755,
-      "step": 24
-    },
-    {
-      "epoch": 3.4098360655737707,
-      "grad_norm": 1.2399470806121826,
-      "learning_rate": 1.4285714285714285e-05,
-      "loss": 6.858,
-      "step": 26
     },
     {
-      "epoch": 3.6721311475409837,
-      "grad_norm": 1.3425202369689941,
       "learning_rate": 0.0,
-      "loss": 6.9506,
-      "step": 28
     },
     {
-      "epoch": 3.6721311475409837,
-      "step": 28,
-      "total_flos": 132611574693336.0,
-      "train_loss": 7.423375640596662,
-      "train_runtime": 122.2841,
-      "train_samples_per_second": 3.991,
-      "train_steps_per_second": 0.229
     }
   ],
   "logging_steps": 2,
-  "max_steps": 28,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 4,
   "save_steps": 500,
@@ -133,7 +49,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 132611574693336.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 4.0,
   "eval_steps": 500,
+  "global_step": 4,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 2.0,
+      "grad_norm": 0.663876473903656,
       "learning_rate": 0.0001,
+      "loss": 2.4015,
+      "step": 2
     },
     {
+      "epoch": 4.0,
+      "grad_norm": 0.4160730838775635,
       "learning_rate": 0.0,
+      "loss": 2.3495,
+      "step": 4
     },
     {
+      "epoch": 4.0,
+      "step": 4,
+      "total_flos": 4508460948192.0,
+      "train_loss": 2.3754985332489014,
+      "train_runtime": 5.8402,
+      "train_samples_per_second": 2.74,
+      "train_steps_per_second": 0.685
     }
   ],
   "logging_steps": 2,
+  "max_steps": 4,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 4,
   "save_steps": 500,
       "attributes": {}
     }
   },
+  "total_flos": 4508460948192.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null