istvanj
/

musicgen-melody-lora-dnb-colab-gs-3-lr-0.0001

Text-to-Audio

PEFT

Safetensors

dnb

Generated from Trainer

Model card | Files and versions | Community

istvanj committed on Nov 29, 2024

Commit

4cea407

verified ·

1 Parent(s): d1cbf7b

End of training

Browse files

Files changed (2) hide show

README.md +3 -1
trainer_state.json +42 -70

README.md CHANGED Viewed

@@ -3,6 +3,8 @@ library_name: peft
 license: cc-by-nc-4.0
 base_model: facebook/musicgen-melody
 tags:
 - generated_from_trainer
 model-index:
 - name: musicgen-melody-lora-dnb-colab-gs-3-lr-0.0001
@@ -14,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
 # musicgen-melody-lora-dnb-colab-gs-3-lr-0.0001
-This model is a fine-tuned version of [facebook/musicgen-melody](https://huggingface.co/facebook/musicgen-melody) on an unknown dataset.
 ## Model description

 license: cc-by-nc-4.0
 base_model: facebook/musicgen-melody
 tags:
+- text-to-audio
+- dnb
 - generated_from_trainer
 model-index:
 - name: musicgen-melody-lora-dnb-colab-gs-3-lr-0.0001
 # musicgen-melody-lora-dnb-colab-gs-3-lr-0.0001
+This model is a fine-tuned version of [facebook/musicgen-melody](https://huggingface.co/facebook/musicgen-melody) on the istvanj/ncs-dnb dataset.
 ## Model description

trainer_state.json CHANGED Viewed

@@ -1,125 +1,97 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.533333333333333,
   "eval_steps": 500,
-  "global_step": 28,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 0.26666666666666666,
-      "grad_norm": 7.983949184417725,
-      "learning_rate": 9.285714285714288e-06,
-      "loss": 9.7008,
       "step": 2
     },
     {
       "epoch": 0.5333333333333333,
-      "grad_norm": 8.53835678100586,
-      "learning_rate": 8.571428571428571e-06,
-      "loss": 9.6854,
       "step": 4
     },
     {
       "epoch": 0.8,
-      "grad_norm": 8.521801948547363,
-      "learning_rate": 7.857142857142858e-06,
-      "loss": 9.6866,
       "step": 6
     },
     {
       "epoch": 1.0,
-      "grad_norm": 4.384256839752197,
-      "learning_rate": 7.1428571428571436e-06,
-      "loss": 7.2247,
       "step": 8
     },
     {
       "epoch": 1.2666666666666666,
-      "grad_norm": 8.3870210647583,
-      "learning_rate": 6.4285714285714295e-06,
-      "loss": 9.6508,
       "step": 10
     },
     {
       "epoch": 1.5333333333333332,
-      "grad_norm": 8.580151557922363,
-      "learning_rate": 5.7142857142857145e-06,
-      "loss": 9.6305,
       "step": 12
     },
     {
       "epoch": 1.8,
-      "grad_norm": 9.1837797164917,
-      "learning_rate": 5e-06,
-      "loss": 9.5792,
       "step": 14
     },
     {
       "epoch": 2.0,
-      "grad_norm": 4.785982131958008,
-      "learning_rate": 4.2857142857142855e-06,
-      "loss": 7.2215,
       "step": 16
     },
     {
       "epoch": 2.2666666666666666,
-      "grad_norm": 8.567254066467285,
-      "learning_rate": 3.5714285714285718e-06,
-      "loss": 9.608,
       "step": 18
     },
     {
       "epoch": 2.533333333333333,
-      "grad_norm": 9.062423706054688,
-      "learning_rate": 2.8571428571428573e-06,
-      "loss": 9.5627,
       "step": 20
     },
     {
-      "epoch": 2.8,
-      "grad_norm": 9.304347038269043,
-      "learning_rate": 2.1428571428571427e-06,
-      "loss": 9.5904,
-      "step": 22
-    },
-    {
-      "epoch": 3.0,
-      "grad_norm": 5.326416969299316,
-      "learning_rate": 1.4285714285714286e-06,
-      "loss": 7.1593,
-      "step": 24
-    },
-    {
-      "epoch": 3.2666666666666666,
-      "grad_norm": 9.835756301879883,
-      "learning_rate": 7.142857142857143e-07,
-      "loss": 9.5721,
-      "step": 26
-    },
-    {
-      "epoch": 3.533333333333333,
-      "grad_norm": 9.394722938537598,
-      "learning_rate": 0.0,
-      "loss": 9.5758,
-      "step": 28
-    },
-    {
-      "epoch": 3.533333333333333,
-      "step": 28,
-      "total_flos": 108812813622552.0,
-      "train_loss": 9.103422130857195,
-      "train_runtime": 670.6646,
-      "train_samples_per_second": 0.716,
-      "train_steps_per_second": 0.042
     }
   ],
   "logging_steps": 2,
-  "max_steps": 28,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 4,
   "save_steps": 500,
   "stateful_callbacks": {
     "TrainerControl": {
@@ -133,7 +105,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 108812813622552.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.6666666666666665,
   "eval_steps": 500,
+  "global_step": 21,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 0.26666666666666666,
+      "grad_norm": 8.077447891235352,
+      "learning_rate": 9.047619047619048e-05,
+      "loss": 9.6711,
       "step": 2
     },
     {
       "epoch": 0.5333333333333333,
+      "grad_norm": 10.438846588134766,
+      "learning_rate": 8.095238095238096e-05,
+      "loss": 9.4926,
       "step": 4
     },
     {
       "epoch": 0.8,
+      "grad_norm": 11.99673080444336,
+      "learning_rate": 7.142857142857143e-05,
+      "loss": 9.2985,
       "step": 6
     },
     {
       "epoch": 1.0,
+      "grad_norm": 8.44992733001709,
+      "learning_rate": 6.19047619047619e-05,
+      "loss": 6.8146,
       "step": 8
     },
     {
       "epoch": 1.2666666666666666,
+      "grad_norm": 15.83218002319336,
+      "learning_rate": 5.2380952380952384e-05,
+      "loss": 8.8302,
       "step": 10
     },
     {
       "epoch": 1.5333333333333332,
+      "grad_norm": 16.710369110107422,
+      "learning_rate": 4.761904761904762e-05,
+      "loss": 8.5759,
       "step": 12
     },
     {
       "epoch": 1.8,
+      "grad_norm": 19.962966918945312,
+      "learning_rate": 3.809523809523809e-05,
+      "loss": 8.3464,
       "step": 14
     },
     {
       "epoch": 2.0,
+      "grad_norm": 9.256256103515625,
+      "learning_rate": 2.857142857142857e-05,
+      "loss": 6.1951,
       "step": 16
     },
     {
       "epoch": 2.2666666666666666,
+      "grad_norm": 18.415756225585938,
+      "learning_rate": 1.9047619047619046e-05,
+      "loss": 8.0719,
       "step": 18
     },
     {
       "epoch": 2.533333333333333,
+      "grad_norm": 14.65276050567627,
+      "learning_rate": 9.523809523809523e-06,
+      "loss": 7.9604,
       "step": 20
     },
     {
+      "epoch": 2.6666666666666665,
+      "step": 21,
+      "total_flos": 82187025809664.0,
+      "train_loss": 8.305864515758696,
+      "train_runtime": 507.9977,
+      "train_samples_per_second": 0.709,
+      "train_steps_per_second": 0.041
     }
   ],
   "logging_steps": 2,
+  "max_steps": 21,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
   "save_steps": 500,
   "stateful_callbacks": {
     "TrainerControl": {
       "attributes": {}
     }
   },
+  "total_flos": 82187025809664.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null