oddadmix committed
Commit c767c8c · verified · 1 Parent(s): 113c9c0

oddadmix/English-To-EgyptianArabic-Translator
README.md CHANGED
@@ -1,5 +1,4 @@
  ---
- library_name: transformers
  license: apache-2.0
  base_model: Helsinki-NLP/opus-mt-en-ar
  tags:
@@ -16,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->

  This model is a fine-tuned version of [Helsinki-NLP/opus-mt-en-ar](https://huggingface.co/Helsinki-NLP/opus-mt-en-ar) on an unknown dataset.
  It achieves the following results on the evaluation set:
- - Loss: 1.8338
+ - Loss: 2.3011

  ## Model description

@@ -39,7 +38,7 @@ The following hyperparameters were used during training:
  - train_batch_size: 16
  - eval_batch_size: 16
  - seed: 42
- - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
  - lr_scheduler_type: linear
  - num_epochs: 20
  - mixed_precision_training: Native AMP
@@ -48,31 +47,31 @@ The following hyperparameters were used during training:

  | Training Loss | Epoch | Step | Validation Loss |
  |:-------------:|:-----:|:-----:|:---------------:|
- | 2.1222 | 1.0 | 2019 | 1.9246 |
- | 1.9763 | 2.0 | 4038 | 1.8663 |
- | 1.8834 | 3.0 | 6057 | 1.8480 |
- | 1.8057 | 4.0 | 8076 | 1.8384 |
- | 1.7176 | 5.0 | 10095 | 1.8243 |
- | 1.6813 | 6.0 | 12114 | 1.8235 |
- | 1.5903 | 7.0 | 14133 | 1.8270 |
- | 1.5615 | 8.0 | 16152 | 1.8201 |
- | 1.4726 | 9.0 | 18171 | 1.8227 |
- | 1.4401 | 10.0 | 20190 | 1.8223 |
- | 1.4126 | 11.0 | 22209 | 1.8224 |
- | 1.4119 | 12.0 | 24228 | 1.8266 |
- | 1.3976 | 13.0 | 26247 | 1.8301 |
- | 1.3645 | 14.0 | 28266 | 1.8272 |
- | 1.3199 | 15.0 | 30285 | 1.8312 |
- | 1.3365 | 16.0 | 32304 | 1.8322 |
- | 1.2928 | 17.0 | 34323 | 1.8309 |
- | 1.2352 | 18.0 | 36342 | 1.8310 |
- | 1.2561 | 19.0 | 38361 | 1.8321 |
- | 1.2623 | 20.0 | 40380 | 1.8338 |
+ | 2.9907 | 1.0 | 2396 | 2.7717 |
+ | 2.6732 | 2.0 | 4792 | 2.5879 |
+ | 2.4873 | 3.0 | 7188 | 2.5003 |
+ | 2.2897 | 4.0 | 9584 | 2.4407 |
+ | 2.2402 | 5.0 | 11980 | 2.4038 |
+ | 2.1045 | 6.0 | 14376 | 2.3795 |
+ | 2.032 | 7.0 | 16772 | 2.3621 |
+ | 1.9792 | 8.0 | 19168 | 2.3410 |
+ | 1.9129 | 9.0 | 21564 | 2.3319 |
+ | 1.8975 | 10.0 | 23960 | 2.3192 |
+ | 1.8107 | 11.0 | 26356 | 2.3170 |
+ | 1.7901 | 12.0 | 28752 | 2.3128 |
+ | 1.7654 | 13.0 | 31148 | 2.3061 |
+ | 1.6899 | 14.0 | 33544 | 2.3042 |
+ | 1.6535 | 15.0 | 35940 | 2.3061 |
+ | 1.6733 | 16.0 | 38336 | 2.3027 |
+ | 1.6643 | 17.0 | 40732 | 2.3029 |
+ | 1.6471 | 18.0 | 43128 | 2.2996 |
+ | 1.6138 | 19.0 | 45524 | 2.3013 |
+ | 1.5878 | 20.0 | 47920 | 2.3011 |


  ### Framework versions

- - Transformers 4.46.3
+ - Transformers 4.35.2
  - Pytorch 2.1.1+cu121
- - Datasets 3.1.0
- - Tokenizers 0.20.3
+ - Datasets 2.14.5
+ - Tokenizers 0.15.1
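The card itself ships without a usage snippet. A minimal sketch for trying the checkpoint, assuming the standard Transformers Marian classes and taking the repo id from this commit's header, could look like:

```python
# Minimal usage sketch (assumed; not part of the committed model card).
from transformers import MarianMTModel, MarianTokenizer

model_id = "oddadmix/English-To-EgyptianArabic-Translator"  # repo id from the commit header

tokenizer = MarianTokenizer.from_pretrained(model_id)
model = MarianMTModel.from_pretrained(model_id)

inputs = tokenizer("How are you today?", return_tensors="pt")
# With no overrides, generate() picks up the defaults committed in this change
# (beam search with num_beams=4, max_length=512).
output_ids = model.generate(**inputs)
print(tokenizer.decode(output_ids[0], skip_special_tokens=True))
```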
config.json CHANGED
@@ -8,6 +8,11 @@
    "MarianMTModel"
  ],
  "attention_dropout": 0.0,
+ "bad_words_ids": [
+   [
+     62801
+   ]
+ ],
  "bos_token_id": 0,
  "classif_dropout": 0.0,
  "classifier_dropout": 0.0,
@@ -38,19 +43,19 @@
    "LABEL_1": 1,
    "LABEL_2": 2
  },
- "max_length": null,
+ "max_length": 512,
  "max_position_embeddings": 512,
  "model_type": "marian",
  "normalize_before": false,
  "normalize_embedding": false,
- "num_beams": null,
+ "num_beams": 4,
  "num_hidden_layers": 6,
  "pad_token_id": 62801,
  "scale_embedding": true,
  "share_encoder_decoder_embeddings": true,
  "static_position_embeddings": true,
  "torch_dtype": "float32",
- "transformers_version": "4.46.3",
+ "transformers_version": "4.35.2",
  "use_cache": true,
  "vocab_size": 62802
  }
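The keys added to config.json are generation defaults: `num_beams=4` enables beam search, `max_length=512` caps output length, and `bad_words_ids=[[62801]]` bans the pad token id (62801) from being produced as a regular token. A hedged sketch of the equivalent explicit call, reusing `model` and `inputs` from the snippet above:

```python
# Passing the newly committed generation defaults explicitly instead of
# relying on the config; behaviour should match the defaults-only call.
output_ids = model.generate(
    **inputs,
    num_beams=4,               # "num_beams": 4
    max_length=512,            # "max_length": 512
    bad_words_ids=[[62801]],   # "bad_words_ids": [[62801]] -- the pad token id
)
```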
generation_config.json CHANGED
@@ -12,5 +12,5 @@
  "num_beams": 4,
  "pad_token_id": 62801,
  "renormalize_logits": true,
- "transformers_version": "4.46.3"
+ "transformers_version": "4.35.2"
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:0710204ebe8eca4fd75b4a52492ecfdeda7663e44497a25e2650d9450ba367c6
+ oid sha256:1223ea902922c7d3e3e45d91653ad8b5bc298a15a545af2ed1e94256d2a0fe29
  size 305452744
runs/Nov21_02-34-07_ncgki16hjz/events.out.tfevents.1732156449.ncgki16hjz.205.0 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:b4d3920a7f74979318891a16ee96ad593565120771308c559a874f477c6ec299
+ size 5182
runs/Nov21_02-35-33_ncgki16hjz/events.out.tfevents.1732156534.ncgki16hjz.205.1 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:117a726ea6504ed4924f0a541d0986921f9d38c44eb30604f7d2f167c05bfeba
+ size 26136
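The two added files under runs/ are TensorBoard event logs written during training. One way to read the logged scalars back without starting the TensorBoard UI is sketched below; the directory name comes from this commit, while the scalar tag is an assumption to verify against `Tags()`:

```python
# Sketch: inspect a committed TensorBoard event file locally.
from tensorboard.backend.event_processing.event_accumulator import EventAccumulator

acc = EventAccumulator("runs/Nov21_02-35-33_ncgki16hjz")  # the larger of the two added runs
acc.Reload()
print(acc.Tags()["scalars"])            # scalar tags actually present in the log
for event in acc.Scalars("eval/loss"):  # tag name is an assumption; check the printed list
    print(event.step, event.value)
```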
tokenizer_config.json CHANGED
@@ -25,7 +25,7 @@
      "special": true
    }
  },
- "clean_up_tokenization_spaces": false,
+ "clean_up_tokenization_spaces": true,
  "eos_token": "</s>",
  "model_max_length": 512,
  "pad_token": "<pad>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:65d24f948d8bd5c43d55238c89b87846c3bc45c8c9cb75d128d4dc98318f25d6
- size 5496
+ oid sha256:b5311556afb3e79c7fd4cda661dce16faffba5d838a87824999817ae88082578
+ size 4792
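training_args.bin is the serialized training-arguments object that the Trainer saves next to the model. Mapping the hyperparameters listed in the README onto `Seq2SeqTrainingArguments` gives roughly the sketch below; the output directory is a placeholder, and fields not visible in this diff (learning rate, warmup, etc.) are left at their defaults:

```python
# Rough, assumed reconstruction of the README's hyperparameter list.
from transformers import Seq2SeqTrainingArguments

training_args = Seq2SeqTrainingArguments(
    output_dir="English-To-EgyptianArabic-Translator",  # placeholder
    per_device_train_batch_size=16,   # train_batch_size: 16
    per_device_eval_batch_size=16,    # eval_batch_size: 16
    seed=42,                          # seed: 42
    lr_scheduler_type="linear",       # lr_scheduler_type: linear
    num_train_epochs=20,              # num_epochs: 20
    fp16=True,                        # mixed_precision_training: Native AMP (needs a CUDA device)
    # adam_beta1/adam_beta2/adam_epsilon defaults (0.9, 0.999, 1e-8) already
    # match the optimizer line in the README.
)
```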