zkdeng committed on
Commit
059544c
·
verified ·
1 Parent(s): eaa225d

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 0.96,
3
- "eval_accuracy": 0.78,
4
- "eval_f1": 0.7285479916951179,
5
- "eval_loss": 3.062906503677368,
6
- "eval_runtime": 1.551,
7
- "eval_samples_per_second": 32.237,
8
- "eval_steps_per_second": 4.513,
9
- "train_loss": 3.5844920873641968,
10
- "train_runtime": 75.7789,
11
- "train_samples_per_second": 5.239,
12
- "train_steps_per_second": 0.158
13
  }
 
1
  {
2
+ "epoch": 0.92,
3
+ "eval_accuracy": 0.6923076923076923,
4
+ "eval_f1": 0.40909090909090906,
5
+ "eval_loss": 2.1946330070495605,
6
+ "eval_runtime": 1.6106,
7
+ "eval_samples_per_second": 16.143,
8
+ "eval_steps_per_second": 2.484,
9
+ "train_loss": 3.3007516860961914,
10
+ "train_runtime": 38.8385,
11
+ "train_samples_per_second": 5.201,
12
+ "train_steps_per_second": 0.154
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "eval_accuracy": 0.78,
3
- "eval_f1": 0.7285479916951179,
4
- "eval_loss": 3.062906503677368,
5
- "eval_runtime": 1.551,
6
- "eval_samples_per_second": 32.237,
7
- "eval_steps_per_second": 4.513
8
  }
 
1
  {
2
+ "eval_accuracy": 0.6923076923076923,
3
+ "eval_f1": 0.40909090909090906,
4
+ "eval_loss": 2.1946330070495605,
5
+ "eval_runtime": 1.6106,
6
+ "eval_samples_per_second": 16.143,
7
+ "eval_steps_per_second": 2.484
8
  }
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 0.96,
3
- "train_loss": 3.5844920873641968,
4
- "train_runtime": 75.7789,
5
- "train_samples_per_second": 5.239,
6
- "train_steps_per_second": 0.158
7
  }
 
1
  {
2
+ "epoch": 0.92,
3
+ "train_loss": 3.3007516860961914,
4
+ "train_runtime": 38.8385,
5
+ "train_samples_per_second": 5.201,
6
+ "train_steps_per_second": 0.154
7
  }
trainer_state.json CHANGED
@@ -1,41 +1,35 @@
1
  {
2
- "best_metric": 0.76,
3
- "best_model_checkpoint": "convnext/checkpoint-12",
4
- "epoch": 0.96,
5
  "eval_steps": 500,
6
- "global_step": 12,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.8,
13
- "learning_rate": 0.0001,
14
- "loss": 3.6602,
15
- "step": 10
 
 
 
 
16
  },
17
  {
18
- "epoch": 0.96,
19
- "eval_accuracy": 0.76,
20
- "eval_f1": 0.7543106131341425,
21
- "eval_loss": 3.08089017868042,
22
- "eval_runtime": 2.178,
23
- "eval_samples_per_second": 22.957,
24
- "eval_steps_per_second": 3.214,
25
- "step": 12
26
- },
27
- {
28
- "epoch": 0.96,
29
- "step": 12,
30
  "total_flos": 0.0,
31
- "train_loss": 3.5844920873641968,
32
- "train_runtime": 75.7789,
33
- "train_samples_per_second": 5.239,
34
- "train_steps_per_second": 0.158
35
  }
36
  ],
37
  "logging_steps": 10,
38
- "max_steps": 12,
39
  "num_train_epochs": 1,
40
  "save_steps": 500,
41
  "total_flos": 0.0,
 
1
  {
2
+ "best_metric": 0.68,
3
+ "best_model_checkpoint": "convnext/checkpoint-6",
4
+ "epoch": 0.9230769230769231,
5
  "eval_steps": 500,
6
+ "global_step": 6,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.92,
13
+ "eval_accuracy": 0.68,
14
+ "eval_f1": 0.40476190476190477,
15
+ "eval_loss": 2.135345935821533,
16
+ "eval_runtime": 3.511,
17
+ "eval_samples_per_second": 7.12,
18
+ "eval_steps_per_second": 1.139,
19
+ "step": 6
20
  },
21
  {
22
+ "epoch": 0.92,
23
+ "step": 6,
 
 
 
 
 
 
 
 
 
 
24
  "total_flos": 0.0,
25
+ "train_loss": 3.3007516860961914,
26
+ "train_runtime": 38.8385,
27
+ "train_samples_per_second": 5.201,
28
+ "train_steps_per_second": 0.154
29
  }
30
  ],
31
  "logging_steps": 10,
32
+ "max_steps": 6,
33
  "num_train_epochs": 1,
34
  "save_steps": 500,
35
  "total_flos": 0.0,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:908a060e4bf217c1550fa07c16f5e2213522a75fa50b925e0edcbb5f8e9c81ef
3
  size 4472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:646e4e2b8a299f0c95adb8e59dc44753490bfc893f30471602f43c2a5305dcdc
3
  size 4472