ELhadratiOth committed on
Commit
4e7b23b
·
verified ·
1 Parent(s): e0f7cba

End of training

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # models
18
 
19
- This model is a fine-tuned version of [Qwen/Qwen2.5-1.5B-Instruct](https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct) on an unknown dataset.
20
 
21
  ## Model description
22
 
 
16
 
17
  # models
18
 
19
+ This model is a fine-tuned version of [Qwen/Qwen2.5-1.5B-Instruct](https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct) on the darija_finetune_train dataset.
20
 
21
  ## Model description
22
 
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 10.0,
3
  "eval_darija_finetune_val_loss": 1.6740385293960571,
4
- "eval_darija_finetune_val_runtime": 248.529,
5
- "eval_darija_finetune_val_samples_per_second": 4.024,
6
- "eval_darija_finetune_val_steps_per_second": 2.012,
7
  "total_flos": 2.3021942645089894e+17,
8
  "train_loss": 0.0,
9
- "train_runtime": 2.5784,
10
- "train_samples_per_second": 46541.284,
11
- "train_steps_per_second": 5817.66
12
  }
 
1
  {
2
  "epoch": 10.0,
3
  "eval_darija_finetune_val_loss": 1.6740385293960571,
4
+ "eval_darija_finetune_val_runtime": 247.6047,
5
+ "eval_darija_finetune_val_samples_per_second": 4.039,
6
+ "eval_darija_finetune_val_steps_per_second": 2.019,
7
  "total_flos": 2.3021942645089894e+17,
8
  "train_loss": 0.0,
9
+ "train_runtime": 1.1327,
10
+ "train_samples_per_second": 105944.302,
11
+ "train_steps_per_second": 13243.038
12
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 10.0,
3
  "eval_darija_finetune_val_loss": 1.6740385293960571,
4
- "eval_darija_finetune_val_runtime": 248.529,
5
- "eval_darija_finetune_val_samples_per_second": 4.024,
6
- "eval_darija_finetune_val_steps_per_second": 2.012
7
  }
 
1
  {
2
  "epoch": 10.0,
3
  "eval_darija_finetune_val_loss": 1.6740385293960571,
4
+ "eval_darija_finetune_val_runtime": 247.6047,
5
+ "eval_darija_finetune_val_samples_per_second": 4.039,
6
+ "eval_darija_finetune_val_steps_per_second": 2.019
7
  }
train_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 10.0,
3
  "total_flos": 2.3021942645089894e+17,
4
  "train_loss": 0.0,
5
- "train_runtime": 2.5784,
6
- "train_samples_per_second": 46541.284,
7
- "train_steps_per_second": 5817.66
8
  }
 
2
  "epoch": 10.0,
3
  "total_flos": 2.3021942645089894e+17,
4
  "train_loss": 0.0,
5
+ "train_runtime": 1.1327,
6
+ "train_samples_per_second": 105944.302,
7
+ "train_steps_per_second": 13243.038
8
  }
trainer_state.json CHANGED
@@ -11713,9 +11713,9 @@
11713
  "step": 15000,
11714
  "total_flos": 2.3021942645089894e+17,
11715
  "train_loss": 0.0,
11716
- "train_runtime": 2.5784,
11717
- "train_samples_per_second": 46541.284,
11718
- "train_steps_per_second": 5817.66
11719
  }
11720
  ],
11721
  "logging_steps": 10,
 
11713
  "step": 15000,
11714
  "total_flos": 2.3021942645089894e+17,
11715
  "train_loss": 0.0,
11716
+ "train_runtime": 1.1327,
11717
+ "train_samples_per_second": 105944.302,
11718
+ "train_steps_per_second": 13243.038
11719
  }
11720
  ],
11721
  "logging_steps": 10,