ShaySha committed on
Commit
38f307d
·
verified ·
1 Parent(s): 85d052e

End of training

Browse files
Files changed (2) hide show
  1. README.md +3 -1
  2. trainer_state.json +12 -82
README.md CHANGED
@@ -3,6 +3,8 @@ base_model: facebook/musicgen-melody
3
  library_name: peft
4
  license: cc-by-nc-4.0
5
  tags:
 
 
6
  - generated_from_trainer
7
  model-index:
8
  - name: musicgen-melody-lora-regular3_techno-colab
@@ -14,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
14
 
15
  # musicgen-melody-lora-regular3_techno-colab
16
 
17
- This model is a fine-tuned version of [facebook/musicgen-melody](https://huggingface.co/facebook/musicgen-melody) on an unknown dataset.
18
 
19
  ## Model description
20
 
 
3
  library_name: peft
4
  license: cc-by-nc-4.0
5
  tags:
6
+ - text-to-audio
7
+ - classic_techno_clips
8
  - generated_from_trainer
9
  model-index:
10
  - name: musicgen-melody-lora-regular3_techno-colab
 
16
 
17
  # musicgen-melody-lora-regular3_techno-colab
18
 
19
+ This model is a fine-tuned version of [facebook/musicgen-melody](https://huggingface.co/facebook/musicgen-melody) on the ShaySha/classic_techno_clips dataset.
20
 
21
  ## Model description
22
 
trainer_state.json CHANGED
@@ -3,100 +3,30 @@
3
  "best_model_checkpoint": null,
4
  "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 22,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
- {
12
- "epoch": 0.18181818181818182,
13
- "grad_norm": 0.9673512578010559,
14
- "learning_rate": 0.00018181818181818183,
15
- "loss": 9.4696,
16
- "step": 2
17
- },
18
- {
19
- "epoch": 0.36363636363636365,
20
- "grad_norm": 1.2611587047576904,
21
- "learning_rate": 0.00016363636363636366,
22
- "loss": 9.1349,
23
- "step": 4
24
- },
25
- {
26
- "epoch": 0.5454545454545454,
27
- "grad_norm": 2.2909739017486572,
28
- "learning_rate": 0.00014545454545454546,
29
- "loss": 8.631,
30
- "step": 6
31
- },
32
- {
33
- "epoch": 0.7272727272727273,
34
- "grad_norm": 2.0307061672210693,
35
- "learning_rate": 0.00012727272727272728,
36
- "loss": 8.0002,
37
- "step": 8
38
- },
39
- {
40
- "epoch": 0.9090909090909091,
41
- "grad_norm": 1.1030476093292236,
42
- "learning_rate": 0.00010909090909090909,
43
- "loss": 7.5263,
44
- "step": 10
45
- },
46
- {
47
- "epoch": 1.0909090909090908,
48
- "grad_norm": 0.8558670878410339,
49
- "learning_rate": 9.090909090909092e-05,
50
- "loss": 7.4314,
51
- "step": 12
52
- },
53
- {
54
- "epoch": 1.2727272727272727,
55
- "grad_norm": 0.947796642780304,
56
- "learning_rate": 7.272727272727273e-05,
57
- "loss": 7.3711,
58
- "step": 14
59
- },
60
- {
61
- "epoch": 1.4545454545454546,
62
- "grad_norm": 0.7418118715286255,
63
- "learning_rate": 5.4545454545454546e-05,
64
- "loss": 7.2495,
65
- "step": 16
66
- },
67
- {
68
- "epoch": 1.6363636363636362,
69
- "grad_norm": 0.7568270564079285,
70
- "learning_rate": 3.6363636363636364e-05,
71
- "loss": 7.2816,
72
- "step": 18
73
- },
74
- {
75
- "epoch": 1.8181818181818183,
76
- "grad_norm": 0.955255389213562,
77
- "learning_rate": 1.8181818181818182e-05,
78
- "loss": 7.3431,
79
- "step": 20
80
- },
81
  {
82
  "epoch": 2.0,
83
- "grad_norm": 0.8418056964874268,
84
  "learning_rate": 0.0,
85
- "loss": 7.1887,
86
- "step": 22
87
  },
88
  {
89
  "epoch": 2.0,
90
- "step": 22,
91
- "total_flos": 26016036946944.0,
92
- "train_loss": 7.875224590301514,
93
- "train_runtime": 563.2063,
94
- "train_samples_per_second": 0.625,
95
- "train_steps_per_second": 0.039
96
  }
97
  ],
98
  "logging_steps": 2,
99
- "max_steps": 22,
100
  "num_input_tokens_seen": 0,
101
  "num_train_epochs": 2,
102
  "save_steps": 500,
@@ -112,7 +42,7 @@
112
  "attributes": {}
113
  }
114
  },
115
- "total_flos": 26016036946944.0,
116
  "train_batch_size": 2,
117
  "trial_name": null,
118
  "trial_params": null
 
3
  "best_model_checkpoint": null,
4
  "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 2,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  {
12
  "epoch": 2.0,
13
+ "grad_norm": 0.3880564868450165,
14
  "learning_rate": 0.0,
15
+ "loss": 3.5507,
16
+ "step": 2
17
  },
18
  {
19
  "epoch": 2.0,
20
+ "step": 2,
21
+ "total_flos": 739091958720.0,
22
+ "train_loss": 3.5507075786590576,
23
+ "train_runtime": 18.2944,
24
+ "train_samples_per_second": 0.547,
25
+ "train_steps_per_second": 0.109
26
  }
27
  ],
28
  "logging_steps": 2,
29
+ "max_steps": 2,
30
  "num_input_tokens_seen": 0,
31
  "num_train_epochs": 2,
32
  "save_steps": 500,
 
42
  "attributes": {}
43
  }
44
  },
45
+ "total_flos": 739091958720.0,
46
  "train_batch_size": 2,
47
  "trial_name": null,
48
  "trial_params": null