Training in progress, step 112
Browse files- config.json +1 -2
- eval/binary_classification_evaluation_Qnli-dev_results.csv +3 -0
- eval/binary_classification_evaluation_allNLI-dev_results.csv +3 -0
- eval/similarity_evaluation_sts-test_results.csv +3 -0
- runs/Apr11_15-35-46_b9a448a0ca50/events.out.tfevents.1744385751.b9a448a0ca50.31.0 +3 -0
- training_args.bin +1 -1
config.json
CHANGED
@@ -1,5 +1,4 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "BAAI/bge-m3",
|
3 |
"architectures": [
|
4 |
"XLMRobertaModel"
|
5 |
],
|
@@ -21,7 +20,7 @@
|
|
21 |
"pad_token_id": 1,
|
22 |
"position_embedding_type": "absolute",
|
23 |
"torch_dtype": "float32",
|
24 |
-
"transformers_version": "4.
|
25 |
"type_vocab_size": 1,
|
26 |
"use_cache": true,
|
27 |
"vocab_size": 250002
|
|
|
1 |
{
|
|
|
2 |
"architectures": [
|
3 |
"XLMRobertaModel"
|
4 |
],
|
|
|
20 |
"pad_token_id": 1,
|
21 |
"position_embedding_type": "absolute",
|
22 |
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.51.1",
|
24 |
"type_vocab_size": 1,
|
25 |
"use_cache": true,
|
26 |
"vocab_size": 250002
|
eval/binary_classification_evaluation_Qnli-dev_results.csv
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cosine_accuracy,cosine_accuracy_threshold,cosine_f1,cosine_precision,cosine_recall,cosine_f1_threshold,cosine_ap,cosine_mcc
|
2 |
+
0.1509433962264151,56,0.70703125,0.6635605096817017,0.7244582043343653,0.585,0.9512195121951219,0.5038043260574341,0.7579116921492454,0.39539276409398366
|
3 |
+
0.3018867924528302,112,0.69921875,0.6639883518218994,0.6956521739130435,0.676923076923077,0.7154471544715447,0.6639883518218994,0.7520437823272439,0.3994014078011956
|
eval/binary_classification_evaluation_allNLI-dev_results.csv
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cosine_accuracy,cosine_accuracy_threshold,cosine_f1,cosine_precision,cosine_recall,cosine_f1_threshold,cosine_ap,cosine_mcc
|
2 |
+
0.1509433962264151,56,0.78125,0.7955116629600525,0.6857142857142857,0.5581395348837209,0.8888888888888888,0.6457934975624084,0.6859718496364101,0.5238511237227645
|
3 |
+
0.3018867924528302,112,0.7734375,0.7482618689537048,0.6769230769230768,0.5789473684210527,0.8148148148148148,0.694869875907898,0.6542135747366074,0.5058060457173612
|
eval/similarity_evaluation_sts-test_results.csv
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cosine_pearson,cosine_spearman
|
2 |
+
0.1509433962264151,56,0.8834267284176791,0.9131686859687813
|
3 |
+
0.3018867924528302,112,0.9037962998590239,0.9228968065127588
|
runs/Apr11_15-35-46_b9a448a0ca50/events.out.tfevents.1744385751.b9a448a0ca50.31.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4433057a9f91ed12e0e0295055a0faee0af234a85dca592c1acb286e8745b235
|
3 |
+
size 33915
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:376f8d1f23e3afc17ce699417922837d0461cc4b226add78679286487de5c3e6
|
3 |
size 5880
|