ahmedr996 committed on
Commit
d2446b3
·
verified ·
1 Parent(s): 02277f7

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
  "eval_accuracy": 1.0,
4
- "eval_loss": 0.24726401269435883,
5
- "eval_runtime": 13.288,
6
- "eval_samples_per_second": 0.677,
7
- "eval_steps_per_second": 0.075
8
  }
 
1
  {
2
+ "epoch": 3.6923076923076925,
3
  "eval_accuracy": 1.0,
4
+ "eval_loss": 0.0028692723717540503,
5
+ "eval_runtime": 25.884,
6
+ "eval_samples_per_second": 0.889,
7
+ "eval_steps_per_second": 0.116
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae97de9d2f80c1f70886a6f3a2fff46bbfa607423ff450b3059f929f12622b8f
3
  size 344940444
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:674d55e0efe8bdad1c17e5fdfe988d9500c2d0322be92ae643e7ccabc1078c5a
3
  size 344940444
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
  "eval_accuracy": 1.0,
4
- "eval_loss": 0.24726401269435883,
5
- "eval_runtime": 13.288,
6
- "eval_samples_per_second": 0.677,
7
- "eval_steps_per_second": 0.075
8
  }
 
1
  {
2
+ "epoch": 3.6923076923076925,
3
  "eval_accuracy": 1.0,
4
+ "eval_loss": 0.0028692723717540503,
5
+ "eval_runtime": 25.884,
6
+ "eval_samples_per_second": 0.889,
7
+ "eval_steps_per_second": 0.116
8
  }
trainer_state.json CHANGED
@@ -1,79 +1,109 @@
1
  {
2
  "best_metric": 1.0,
3
- "best_model_checkpoint": "videomae-base-finetuned-soccer\\checkpoint-4",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 12,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
11
  {
12
  "epoch": 1.0,
13
  "eval_accuracy": 1.0,
14
- "eval_loss": 0.20363736152648926,
15
- "eval_runtime": 9.1182,
16
- "eval_samples_per_second": 0.768,
17
- "eval_steps_per_second": 0.11,
18
- "step": 4
 
 
 
 
 
 
 
19
  },
20
  {
21
  "epoch": 2.0,
22
  "eval_accuracy": 1.0,
23
- "eval_loss": 0.010900563560426235,
24
- "eval_runtime": 9.0053,
25
- "eval_samples_per_second": 0.777,
26
- "eval_steps_per_second": 0.111,
27
- "step": 8
28
  },
29
  {
30
- "epoch": 2.5,
31
- "grad_norm": 0.2005084902048111,
32
- "learning_rate": 1e-05,
33
- "loss": 0.4029,
34
- "step": 10
35
  },
36
  {
37
  "epoch": 3.0,
38
  "eval_accuracy": 1.0,
39
- "eval_loss": 0.004224988166242838,
40
- "eval_runtime": 9.5263,
41
- "eval_samples_per_second": 0.735,
42
- "eval_steps_per_second": 0.105,
43
- "step": 12
44
  },
45
  {
46
- "epoch": 3.0,
47
- "step": 12,
48
- "total_flos": 2.09338851031253e+17,
49
- "train_loss": 0.3365984517149627,
50
- "train_runtime": 293.1214,
51
- "train_samples_per_second": 0.655,
52
- "train_steps_per_second": 0.041
53
  },
54
  {
55
- "epoch": 3.0,
56
  "eval_accuracy": 1.0,
57
- "eval_loss": 0.24726401269435883,
58
- "eval_runtime": 15.5309,
59
- "eval_samples_per_second": 0.579,
60
- "eval_steps_per_second": 0.064,
61
- "step": 12
62
  },
63
  {
64
- "epoch": 3.0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  "eval_accuracy": 1.0,
66
- "eval_loss": 0.24726401269435883,
67
- "eval_runtime": 13.288,
68
- "eval_samples_per_second": 0.677,
69
- "eval_steps_per_second": 0.075,
70
- "step": 12
71
  }
72
  ],
73
  "logging_steps": 10,
74
- "max_steps": 12,
75
  "num_input_tokens_seen": 0,
76
- "num_train_epochs": 3,
77
  "save_steps": 500,
78
  "stateful_callbacks": {
79
  "TrainerControl": {
@@ -87,8 +117,8 @@
87
  "attributes": {}
88
  }
89
  },
90
- "total_flos": 2.09338851031253e+17,
91
- "train_batch_size": 16,
92
  "trial_name": null,
93
  "trial_params": null
94
  }
 
1
  {
2
  "best_metric": 1.0,
3
+ "best_model_checkpoint": "videomae-base-finetuned-soccer\\checkpoint-13",
4
+ "epoch": 3.6923076923076925,
5
  "eval_steps": 500,
6
+ "global_step": 48,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
+ {
12
+ "epoch": 0.7692307692307693,
13
+ "grad_norm": 0.3097344934940338,
14
+ "learning_rate": 4.418604651162791e-05,
15
+ "loss": 0.4706,
16
+ "step": 10
17
+ },
18
  {
19
  "epoch": 1.0,
20
  "eval_accuracy": 1.0,
21
+ "eval_loss": 0.002405111910775304,
22
+ "eval_runtime": 14.963,
23
+ "eval_samples_per_second": 0.802,
24
+ "eval_steps_per_second": 0.134,
25
+ "step": 13
26
+ },
27
+ {
28
+ "epoch": 1.5384615384615383,
29
+ "grad_norm": 0.024141477420926094,
30
+ "learning_rate": 3.2558139534883724e-05,
31
+ "loss": 0.0027,
32
+ "step": 20
33
  },
34
  {
35
  "epoch": 2.0,
36
  "eval_accuracy": 1.0,
37
+ "eval_loss": 0.000666652515064925,
38
+ "eval_runtime": 14.6823,
39
+ "eval_samples_per_second": 0.817,
40
+ "eval_steps_per_second": 0.136,
41
+ "step": 26
42
  },
43
  {
44
+ "epoch": 2.3076923076923075,
45
+ "grad_norm": 0.013116070069372654,
46
+ "learning_rate": 2.0930232558139536e-05,
47
+ "loss": 0.0008,
48
+ "step": 30
49
  },
50
  {
51
  "epoch": 3.0,
52
  "eval_accuracy": 1.0,
53
+ "eval_loss": 0.0004932748270221055,
54
+ "eval_runtime": 15.7105,
55
+ "eval_samples_per_second": 0.764,
56
+ "eval_steps_per_second": 0.127,
57
+ "step": 39
58
  },
59
  {
60
+ "epoch": 3.076923076923077,
61
+ "grad_norm": 0.011234880425035954,
62
+ "learning_rate": 9.302325581395349e-06,
63
+ "loss": 0.0005,
64
+ "step": 40
 
 
65
  },
66
  {
67
+ "epoch": 3.6923076923076925,
68
  "eval_accuracy": 1.0,
69
+ "eval_loss": 0.00047058644122444093,
70
+ "eval_runtime": 15.9668,
71
+ "eval_samples_per_second": 0.752,
72
+ "eval_steps_per_second": 0.125,
73
+ "step": 48
74
  },
75
  {
76
+ "epoch": 3.6923076923076925,
77
+ "step": 48,
78
+ "total_flos": 4.523254798444462e+17,
79
+ "train_loss": 0.09896005064365454,
80
+ "train_runtime": 623.0335,
81
+ "train_samples_per_second": 0.616,
82
+ "train_steps_per_second": 0.077
83
+ },
84
+ {
85
+ "epoch": 3.6923076923076925,
86
+ "eval_accuracy": 1.0,
87
+ "eval_loss": 0.0028692723717540503,
88
+ "eval_runtime": 32.8199,
89
+ "eval_samples_per_second": 0.701,
90
+ "eval_steps_per_second": 0.091,
91
+ "step": 48
92
+ },
93
+ {
94
+ "epoch": 3.6923076923076925,
95
  "eval_accuracy": 1.0,
96
+ "eval_loss": 0.0028692723717540503,
97
+ "eval_runtime": 25.884,
98
+ "eval_samples_per_second": 0.889,
99
+ "eval_steps_per_second": 0.116,
100
+ "step": 48
101
  }
102
  ],
103
  "logging_steps": 10,
104
+ "max_steps": 48,
105
  "num_input_tokens_seen": 0,
106
+ "num_train_epochs": 4,
107
  "save_steps": 500,
108
  "stateful_callbacks": {
109
  "TrainerControl": {
 
117
  "attributes": {}
118
  }
119
  },
120
+ "total_flos": 4.523254798444462e+17,
121
+ "train_batch_size": 8,
122
  "trial_name": null,
123
  "trial_params": null
124
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f9b09f5c64af0e0c1bcc149348b0dbadf5b840eb6b6102ecd7c363cb80ddac4
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ead260bf9961cab0d9166afe1d69a5f0f6c4275c04c12fd81197181a4a370ad
3
  size 5368