hugosousa committed on
Commit
fa7f00b
·
verified ·
1 Parent(s): 079555f

End of training

Browse files
Files changed (5) hide show
  1. README.md +19 -19
  2. all_results.json +53 -0
  3. eval_results.json +37 -0
  4. train_results.json +19 -0
  5. trainer_state.json +0 -0
README.md CHANGED
@@ -18,31 +18,31 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [HuggingFaceTB/SmolLM2-135M](https://huggingface.co/HuggingFaceTB/SmolLM2-135M) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.1038
22
- - < Precision: 0.9661
23
- - < Recall: 0.9714
24
- - < F1-score: 0.9687
25
  - < Support: 4865.0
26
- - > Precision: 0.9688
27
- - > Recall: 0.9700
28
- - > F1-score: 0.9694
29
  - > Support: 4865.0
30
- - = Precision: 0.8884
31
- - = Recall: 0.8024
32
- - = F1-score: 0.8432
33
  - = Support: 248.0
34
- - - Precision: 0.4615
35
  - - Recall: 0.2727
36
- - - F1-score: 0.3429
37
  - - Support: 22.0
38
- - Accuracy: 0.965
39
- - Macro Avg Precision: 0.8212
40
- - Macro Avg Recall: 0.7541
41
- - Macro Avg F1-score: 0.7811
42
  - Macro Avg Support: 10000.0
43
- - Weighted Avg Precision: 0.9644
44
- - Weighted Avg Recall: 0.965
45
- - Weighted Avg F1-score: 0.9646
46
  - Weighted Avg Support: 10000.0
47
 
48
  ## Model description
 
18
 
19
  This model is a fine-tuned version of [HuggingFaceTB/SmolLM2-135M](https://huggingface.co/HuggingFaceTB/SmolLM2-135M) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.1047
22
+ - < Precision: 0.9674
23
+ - < Recall: 0.9708
24
+ - < F1-score: 0.9691
25
  - < Support: 4865.0
26
+ - > Precision: 0.9686
27
+ - > Recall: 0.9706
28
+ - > F1-score: 0.9696
29
  - > Support: 4865.0
30
+ - = Precision: 0.8734
31
+ - = Recall: 0.8065
32
+ - = F1-score: 0.8386
33
  - = Support: 248.0
34
+ - - Precision: 0.4286
35
  - - Recall: 0.2727
36
+ - - F1-score: 0.3333
37
  - - Support: 22.0
38
+ - Accuracy: 0.9651
39
+ - Macro Avg Precision: 0.8095
40
+ - Macro Avg Recall: 0.7551
41
+ - Macro Avg F1-score: 0.7777
42
  - Macro Avg Support: 10000.0
43
+ - Weighted Avg Precision: 0.9645
44
+ - Weighted Avg Recall: 0.9651
45
+ - Weighted Avg F1-score: 0.9647
46
  - Weighted Avg Support: 10000.0
47
 
48
  ## Model description
all_results.json ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "before_init_mem_cpu": 3040526336,
3
+ "before_init_mem_gpu": 512,
4
+ "epoch": 18.0,
5
+ "eval_-_f1-score": 0.3333333333333333,
6
+ "eval_-_precision": 0.42857142857142855,
7
+ "eval_-_recall": 0.2727272727272727,
8
+ "eval_-_support": 22.0,
9
+ "eval_<_f1-score": 0.9691187031907254,
10
+ "eval_<_precision": 0.9674313805817288,
11
+ "eval_<_recall": 0.9708119218910586,
12
+ "eval_<_support": 4865.0,
13
+ "eval_=_f1-score": 0.8385744234800838,
14
+ "eval_=_precision": 0.8733624454148472,
15
+ "eval_=_recall": 0.8064516129032258,
16
+ "eval_=_support": 248.0,
17
+ "eval_>_f1-score": 0.9696098562628337,
18
+ "eval_>_precision": 0.9686153846153847,
19
+ "eval_>_recall": 0.9706063720452209,
20
+ "eval_>_support": 4865.0,
21
+ "eval_accuracy": 0.9651,
22
+ "eval_loss": 0.10465546697378159,
23
+ "eval_macro_avg_f1-score": 0.777659079066744,
24
+ "eval_macro_avg_precision": 0.8094951597958472,
25
+ "eval_macro_avg_recall": 0.7551492948916945,
26
+ "eval_macro_avg_support": 10000.0,
27
+ "eval_mem_cpu_alloc_delta": -175185920,
28
+ "eval_mem_cpu_peaked_delta": 175185920,
29
+ "eval_mem_gpu_alloc_delta": 0,
30
+ "eval_mem_gpu_peaked_delta": 1242359296,
31
+ "eval_runtime": 12.3635,
32
+ "eval_samples": 10000,
33
+ "eval_samples_per_second": 808.83,
34
+ "eval_steps_per_second": 3.235,
35
+ "eval_weighted_avg_f1-score": 0.964721423209796,
36
+ "eval_weighted_avg_precision": 0.964488997057541,
37
+ "eval_weighted_avg_recall": 0.9651,
38
+ "eval_weighted_avg_support": 10000.0,
39
+ "init_mem_cpu_alloc_delta": 18427904,
40
+ "init_mem_cpu_peaked_delta": 0,
41
+ "init_mem_gpu_alloc_delta": 0,
42
+ "init_mem_gpu_peaked_delta": 0,
43
+ "total_flos": 2.949719748897669e+18,
44
+ "train_loss": 0.22952656600628965,
45
+ "train_mem_cpu_alloc_delta": 826355712,
46
+ "train_mem_cpu_peaked_delta": 403324928,
47
+ "train_mem_gpu_alloc_delta": 690193408,
48
+ "train_mem_gpu_peaked_delta": 19408810496,
49
+ "train_runtime": 33563.6304,
50
+ "train_samples": 502272,
51
+ "train_samples_per_second": 448.943,
52
+ "train_steps_per_second": 0.877
53
+ }
eval_results.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 18.0,
3
+ "eval_-_f1-score": 0.3333333333333333,
4
+ "eval_-_precision": 0.42857142857142855,
5
+ "eval_-_recall": 0.2727272727272727,
6
+ "eval_-_support": 22.0,
7
+ "eval_<_f1-score": 0.9691187031907254,
8
+ "eval_<_precision": 0.9674313805817288,
9
+ "eval_<_recall": 0.9708119218910586,
10
+ "eval_<_support": 4865.0,
11
+ "eval_=_f1-score": 0.8385744234800838,
12
+ "eval_=_precision": 0.8733624454148472,
13
+ "eval_=_recall": 0.8064516129032258,
14
+ "eval_=_support": 248.0,
15
+ "eval_>_f1-score": 0.9696098562628337,
16
+ "eval_>_precision": 0.9686153846153847,
17
+ "eval_>_recall": 0.9706063720452209,
18
+ "eval_>_support": 4865.0,
19
+ "eval_accuracy": 0.9651,
20
+ "eval_loss": 0.10465546697378159,
21
+ "eval_macro_avg_f1-score": 0.777659079066744,
22
+ "eval_macro_avg_precision": 0.8094951597958472,
23
+ "eval_macro_avg_recall": 0.7551492948916945,
24
+ "eval_macro_avg_support": 10000.0,
25
+ "eval_mem_cpu_alloc_delta": -175185920,
26
+ "eval_mem_cpu_peaked_delta": 175185920,
27
+ "eval_mem_gpu_alloc_delta": 0,
28
+ "eval_mem_gpu_peaked_delta": 1242359296,
29
+ "eval_runtime": 12.3635,
30
+ "eval_samples": 10000,
31
+ "eval_samples_per_second": 808.83,
32
+ "eval_steps_per_second": 3.235,
33
+ "eval_weighted_avg_f1-score": 0.964721423209796,
34
+ "eval_weighted_avg_precision": 0.964488997057541,
35
+ "eval_weighted_avg_recall": 0.9651,
36
+ "eval_weighted_avg_support": 10000.0
37
+ }
train_results.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "before_init_mem_cpu": 3040526336,
3
+ "before_init_mem_gpu": 512,
4
+ "epoch": 18.0,
5
+ "init_mem_cpu_alloc_delta": 18427904,
6
+ "init_mem_cpu_peaked_delta": 0,
7
+ "init_mem_gpu_alloc_delta": 0,
8
+ "init_mem_gpu_peaked_delta": 0,
9
+ "total_flos": 2.949719748897669e+18,
10
+ "train_loss": 0.22952656600628965,
11
+ "train_mem_cpu_alloc_delta": 826355712,
12
+ "train_mem_cpu_peaked_delta": 403324928,
13
+ "train_mem_gpu_alloc_delta": 690193408,
14
+ "train_mem_gpu_peaked_delta": 19408810496,
15
+ "train_runtime": 33563.6304,
16
+ "train_samples": 502272,
17
+ "train_samples_per_second": 448.943,
18
+ "train_steps_per_second": 0.877
19
+ }
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff