andro-flock committed on
Commit
f60331a
·
verified ·
1 Parent(s): 7c0fe75

End of training

Browse files
Files changed (4) hide show
  1. README.md +3 -1
  2. all_results.json +6 -6
  3. train_results.json +6 -6
  4. trainer_state.json +18 -39
README.md CHANGED
@@ -2,6 +2,8 @@
2
  library_name: transformers
3
  base_model: andro-flock/b2-classification
4
  tags:
 
 
5
  - generated_from_trainer
6
  model-index:
7
  - name: b2-segmentation
@@ -13,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # b2-segmentation
15
 
16
- This model is a fine-tuned version of [andro-flock/b2-classification](https://huggingface.co/andro-flock/b2-classification) on an unknown dataset.
17
 
18
  ## Model description
19
 
 
2
  library_name: transformers
3
  base_model: andro-flock/b2-classification
4
  tags:
5
+ - image-segmentation
6
+ - vision
7
  - generated_from_trainer
8
  model-index:
9
  - name: b2-segmentation
 
15
 
16
  # b2-segmentation
17
 
18
+ This model is a fine-tuned version of [andro-flock/b2-classification](https://huggingface.co/andro-flock/b2-classification) on the andro-flock/semantic-segment-4class dataset.
19
 
20
  ## Model description
21
 
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 500.0,
3
- "total_flos": 7.8886713950208e+16,
4
- "train_loss": 0.1895984401702881,
5
- "train_runtime": 397.1334,
6
- "train_samples_per_second": 20.144,
7
- "train_steps_per_second": 2.518
8
  }
 
1
  {
2
+ "epoch": 250.0,
3
+ "total_flos": 2.903671701504e+17,
4
+ "train_loss": 0.08589911651611327,
5
+ "train_runtime": 1399.8181,
6
+ "train_samples_per_second": 2.858,
7
+ "train_steps_per_second": 0.357
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 500.0,
3
- "total_flos": 7.8886713950208e+16,
4
- "train_loss": 0.1895984401702881,
5
- "train_runtime": 397.1334,
6
- "train_samples_per_second": 20.144,
7
- "train_steps_per_second": 2.518
8
  }
 
1
  {
2
+ "epoch": 250.0,
3
+ "total_flos": 2.903671701504e+17,
4
+ "train_loss": 0.08589911651611327,
5
+ "train_runtime": 1399.8181,
6
+ "train_samples_per_second": 2.858,
7
+ "train_steps_per_second": 0.357
8
  }
trainer_state.json CHANGED
@@ -1,62 +1,41 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 500.0,
5
  "eval_steps": 500,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 100.0,
13
- "grad_norm": 1.8578704595565796,
14
- "learning_rate": 4.8020000000000004e-05,
15
- "loss": 0.4234,
16
  "step": 200
17
  },
18
  {
19
  "epoch": 200.0,
20
- "grad_norm": 0.6928507685661316,
21
- "learning_rate": 3.604e-05,
22
- "loss": 0.1814,
23
- "step": 400
24
- },
25
- {
26
- "epoch": 300.0,
27
- "grad_norm": 1.1086845397949219,
28
- "learning_rate": 2.406e-05,
29
- "loss": 0.1281,
30
- "step": 600
31
- },
32
- {
33
- "epoch": 400.0,
34
- "grad_norm": 1.4631288051605225,
35
  "learning_rate": 1.2079999999999998e-05,
36
- "loss": 0.1144,
37
- "step": 800
38
- },
39
- {
40
- "epoch": 500.0,
41
- "grad_norm": 0.9606817364692688,
42
- "learning_rate": 1e-07,
43
- "loss": 0.1007,
44
- "step": 1000
45
  },
46
  {
47
- "epoch": 500.0,
48
- "step": 1000,
49
- "total_flos": 7.8886713950208e+16,
50
- "train_loss": 0.1895984401702881,
51
- "train_runtime": 397.1334,
52
- "train_samples_per_second": 20.144,
53
- "train_steps_per_second": 2.518
54
  }
55
  ],
56
  "logging_steps": 200,
57
- "max_steps": 1000,
58
  "num_input_tokens_seen": 0,
59
- "num_train_epochs": 500,
60
  "save_steps": 500,
61
  "stateful_callbacks": {
62
  "TrainerControl": {
@@ -70,7 +49,7 @@
70
  "attributes": {}
71
  }
72
  },
73
- "total_flos": 7.8886713950208e+16,
74
  "train_batch_size": 8,
75
  "trial_name": null,
76
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 250.0,
5
  "eval_steps": 500,
6
+ "global_step": 500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 100.0,
13
+ "grad_norm": 0.17752039432525635,
14
+ "learning_rate": 3.604e-05,
15
+ "loss": 0.1262,
16
  "step": 200
17
  },
18
  {
19
  "epoch": 200.0,
20
+ "grad_norm": 0.3985879421234131,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
  "learning_rate": 1.2079999999999998e-05,
22
+ "loss": 0.062,
23
+ "step": 400
 
 
 
 
 
 
 
24
  },
25
  {
26
+ "epoch": 250.0,
27
+ "step": 500,
28
+ "total_flos": 2.903671701504e+17,
29
+ "train_loss": 0.08589911651611327,
30
+ "train_runtime": 1399.8181,
31
+ "train_samples_per_second": 2.858,
32
+ "train_steps_per_second": 0.357
33
  }
34
  ],
35
  "logging_steps": 200,
36
+ "max_steps": 500,
37
  "num_input_tokens_seen": 0,
38
+ "num_train_epochs": 250,
39
  "save_steps": 500,
40
  "stateful_callbacks": {
41
  "TrainerControl": {
 
49
  "attributes": {}
50
  }
51
  },
52
+ "total_flos": 2.903671701504e+17,
53
  "train_batch_size": 8,
54
  "trial_name": null,
55
  "trial_params": null