Mikhail Biriuchinskii committed on
Commit
b459b62
1 Parent(s): 25e35db

fekpghojezpoh/sarcasm_BARThez

Browse files
README.md CHANGED
@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  This model is a fine-tuned version of [moussaKam/barthez-orangesum-abstract](https://huggingface.co/moussaKam/barthez-orangesum-abstract) on the None dataset.
17
  It achieves the following results on the evaluation set:
18
- - Loss: 12.3591
19
 
20
  ## Model description
21
 
@@ -46,7 +46,7 @@ The following hyperparameters were used during training:
46
 
47
  | Training Loss | Epoch | Step | Validation Loss |
48
  |:-------------:|:-----:|:----:|:---------------:|
49
- | No log | 1.0 | 5 | 12.3591 |
50
 
51
 
52
  ### Framework versions
 
15
 
16
  This model is a fine-tuned version of [moussaKam/barthez-orangesum-abstract](https://huggingface.co/moussaKam/barthez-orangesum-abstract) on the None dataset.
17
  It achieves the following results on the evaluation set:
18
+ - Loss: 1.2689
19
 
20
  ## Model description
21
 
 
46
 
47
  | Training Loss | Epoch | Step | Validation Loss |
48
  |:-------------:|:-----:|:----:|:---------------:|
49
+ | No log | 1.0 | 5 | 1.2689 |
50
 
51
 
52
  ### Framework versions
config.json CHANGED
@@ -19,6 +19,7 @@
19
  "decoder_start_token_id": 2,
20
  "do_blenderbot_90_layernorm": false,
21
  "dropout": 0.1,
 
22
  "encoder_attention_heads": 12,
23
  "encoder_ffn_dim": 3072,
24
  "encoder_layerdrop": 0.0,
@@ -26,6 +27,7 @@
26
  "eos_token_id": 2,
27
  "extra_pos_embeddings": 2,
28
  "force_bos_token_to_be_generated": false,
 
29
  "id2label": {
30
  "0": "LABEL_0",
31
  "1": "LABEL_1",
@@ -42,7 +44,6 @@
42
  "model_type": "mbart",
43
  "normalize_before": true,
44
  "normalize_embedding": true,
45
- "num_beams": 2,
46
  "num_hidden_layers": 6,
47
  "pad_token_id": 1,
48
  "scale_embedding": false,
 
19
  "decoder_start_token_id": 2,
20
  "do_blenderbot_90_layernorm": false,
21
  "dropout": 0.1,
22
+ "early_stopping": true,
23
  "encoder_attention_heads": 12,
24
  "encoder_ffn_dim": 3072,
25
  "encoder_layerdrop": 0.0,
 
27
  "eos_token_id": 2,
28
  "extra_pos_embeddings": 2,
29
  "force_bos_token_to_be_generated": false,
30
+ "forced_eos_token_id": 2,
31
  "id2label": {
32
  "0": "LABEL_0",
33
  "1": "LABEL_1",
 
44
  "model_type": "mbart",
45
  "normalize_before": true,
46
  "normalize_embedding": true,
 
47
  "num_hidden_layers": 6,
48
  "pad_token_id": 1,
49
  "scale_embedding": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:887c0ec1471a11e4e09da0ff289cd295b3446e027bc6b1eee2f1ca7a36e2fb80
3
  size 557116312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e1209921a56568d60eeae837eb6bd98a7ac88eec576e1e5f3315592b311754e
3
  size 557116312
runs/Feb27_12-43-53_aa9548bf9a52/events.out.tfevents.1709037834.aa9548bf9a52.4055.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed1c6c2773cc40a8ccb99f80f312a2feb2bcbe4dac695bdc4156a3cb8fd335b1
3
+ size 6301
runs/Feb27_12-43-53_aa9548bf9a52/events.out.tfevents.1709037864.aa9548bf9a52.4055.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56d612c014112a6709bbc024e390066b152c83294b111262c607c2ffea897c6e
3
+ size 354
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08cac45b34f92a57d8587b674dceca13a552f95a665ecf24f89b8e5ff6e3cfa8
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d461d26b86b2dd1e52391f36ee6ac53d7c7f2fb11557dc3f25ffaccdf045f53
3
  size 5112