Upload 10 files
#2
by
MounikaAithagoni
- opened
- Q1_Models Comparison.docx +0 -0
- Q2_Hyperparameters.docx +0 -0
- Q3_The evaluation strategy.docx +0 -0
- Q4_Google Translate Deployment.docx +0 -0
- Q5_training_curve_Phi_3_5_Arabic (2).csv +38 -0
- Q6_loss curve from the Phi-3.5-mini-instruct model.docx +0 -0
- Q7_Training_Arabic_and_English.ipynb +0 -0
- Q8_Evaluation_Arabic_and_English_Translator.ipynb +0 -0
- loss_curve_Phi_3_5_Arabic (4).png +0 -0
- training_curve_Phi_3_5_Arabic9.csv +38 -0
Q1_Models Comparison.docx
ADDED
Binary file (14.7 kB). View file
|
|
Q2_Hyperparameters.docx
ADDED
Binary file (13.1 kB). View file
|
|
Q3_The evaluation strategy.docx
ADDED
Binary file (23 kB). View file
|
|
Q4_Google Translate Deployment.docx
ADDED
Binary file (117 kB). View file
|
|
Q5_training_curve_Phi_3_5_Arabic (2).csv
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
loss,grad_norm,learning_rate,epoch,step,eval_loss,eval_runtime,eval_samples_per_second,eval_steps_per_second,train_runtime,train_samples_per_second,train_steps_per_second,total_flos,train_loss
|
2 |
+
1.2534,0.7888012528419495,4e-05,0.025,1,,,,,,,,,
|
3 |
+
1.6814,1.304793119430542,8e-05,0.05,2,,,,,,,,,
|
4 |
+
1.7566,1.2770837545394897,0.00012,0.075,3,,,,,,,,,
|
5 |
+
1.3991,0.9290549755096436,0.00016,0.1,4,,,,,,,,,
|
6 |
+
1.3387,0.8864096999168396,0.0002,0.125,5,,,,,,,,,
|
7 |
+
,,,0.125,5,1.0552338361740112,7.1909,11.125,1.391,,,,,
|
8 |
+
0.8119,0.3486979305744171,0.000192,0.15,6,,,,,,,,,
|
9 |
+
0.8837,0.46293407678604126,0.00018400000000000003,0.175,7,,,,,,,,,
|
10 |
+
0.6576,0.3244289755821228,0.00017600000000000002,0.2,8,,,,,,,,,
|
11 |
+
0.6484,0.2247825413942337,0.000168,0.225,9,,,,,,,,,
|
12 |
+
0.7436,0.4602418839931488,0.00016,0.25,10,,,,,,,,,
|
13 |
+
,,,0.25,10,0.725510835647583,4.8682,16.433,2.054,,,,,
|
14 |
+
0.7571,0.2589215636253357,0.000152,0.275,11,,,,,,,,,
|
15 |
+
0.9006,0.40398478507995605,0.000144,0.3,12,,,,,,,,,
|
16 |
+
0.5278,0.19507887959480286,0.00013600000000000003,0.325,13,,,,,,,,,
|
17 |
+
0.5557,0.20721735060214996,0.00012800000000000002,0.35,14,,,,,,,,,
|
18 |
+
0.5042,0.1408037394285202,0.00012,0.375,15,,,,,,,,,
|
19 |
+
,,,0.375,15,0.6471825242042542,4.8773,16.403,2.05,,,,,
|
20 |
+
0.6344,0.20234538614749908,0.00011200000000000001,0.4,16,,,,,,,,,
|
21 |
+
0.5956,0.28273141384124756,0.00010400000000000001,0.425,17,,,,,,,,,
|
22 |
+
0.6394,0.42618072032928467,9.6e-05,0.45,18,,,,,,,,,
|
23 |
+
0.6881,0.23107975721359253,8.800000000000001e-05,0.475,19,,,,,,,,,
|
24 |
+
0.5356,0.17914614081382751,8e-05,0.5,20,,,,,,,,,
|
25 |
+
,,,0.5,20,0.5898063778877258,4.8632,16.45,2.056,,,,,
|
26 |
+
0.5028,0.1842283010482788,7.2e-05,0.525,21,,,,,,,,,
|
27 |
+
0.4696,0.17058564722537994,6.400000000000001e-05,0.55,22,,,,,,,,,
|
28 |
+
0.6429,0.2980625331401825,5.6000000000000006e-05,0.575,23,,,,,,,,,
|
29 |
+
0.5543,0.2445172369480133,4.8e-05,0.6,24,,,,,,,,,
|
30 |
+
0.492,0.3871745765209198,4e-05,0.625,25,,,,,,,,,
|
31 |
+
,,,0.625,25,0.5556104779243469,4.8657,16.442,2.055,,,,,
|
32 |
+
0.4687,0.3489736318588257,3.2000000000000005e-05,0.65,26,,,,,,,,,
|
33 |
+
0.5499,0.18392369151115417,2.4e-05,0.675,27,,,,,,,,,
|
34 |
+
0.479,0.21796149015426636,1.6000000000000003e-05,0.7,28,,,,,,,,,
|
35 |
+
0.5323,0.2878962457180023,8.000000000000001e-06,0.725,29,,,,,,,,,
|
36 |
+
0.5485,0.22873283922672272,0.0,0.75,30,,,,,,,,,
|
37 |
+
,,,0.75,30,0.5422899127006531,4.8679,16.434,2.054,,,,,
|
38 |
+
,,,0.75,30,,,,,116.3306,2.063,0.258,2819390830755840.0,0.7584310283263525
|
Q6_loss curve from the Phi-3.5-mini-instruct model.docx
ADDED
Binary file (53.2 kB). View file
|
|
Q7_Training_Arabic_and_English.ipynb
ADDED
The diff for this file is too large to render.
See raw diff
|
|
Q8_Evaluation_Arabic_and_English_Translator.ipynb
ADDED
The diff for this file is too large to render.
See raw diff
|
|
loss_curve_Phi_3_5_Arabic (4).png
ADDED
training_curve_Phi_3_5_Arabic9.csv
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
loss,grad_norm,learning_rate,epoch,step,eval_loss,eval_runtime,eval_samples_per_second,eval_steps_per_second,train_runtime,train_samples_per_second,train_steps_per_second,total_flos,train_loss
|
2 |
+
1.2534,0.788801253,4.00E-05,0.025,1,,,,,,,,,
|
3 |
+
1.6814,1.304793119,8.00E-05,0.05,2,,,,,,,,,
|
4 |
+
1.7566,1.277083755,0.00012,0.075,3,,,,,,,,,
|
5 |
+
1.3991,0.929054976,0.00016,0.1,4,,,,,,,,,
|
6 |
+
1.3387,0.8864097,0.0002,0.125,5,,,,,,,,,
|
7 |
+
1.055233836,7.1909,,0.125,5,1.055233836,7.1909,11.125,1.391,,,,,
|
8 |
+
0.8119,0.348697931,0.000192,0.15,6,,,,,,,,,
|
9 |
+
0.8837,0.462934077,0.000184,0.175,7,,,,,,,,,
|
10 |
+
0.6576,0.324428976,0.000176,0.2,8,,,,,,,,,
|
11 |
+
0.6484,0.224782541,0.000168,0.225,9,,,,,,,,,
|
12 |
+
0.7436,0.460241884,0.00016,0.25,10,,,,,,,,,
|
13 |
+
0.725510836,4.8682,,0.25,10,0.725510836,4.8682,16.433,2.054,,,,,
|
14 |
+
0.7571,0.258921564,0.000152,0.275,11,,,,,,,,,
|
15 |
+
0.9006,0.403984785,0.000144,0.3,12,,,,,,,,,
|
16 |
+
0.5278,0.19507888,0.000136,0.325,13,,,,,,,,,
|
17 |
+
0.5557,0.207217351,0.000128,0.35,14,,,,,,,,,
|
18 |
+
0.5042,0.140803739,0.00012,0.375,15,,,,,,,,,
|
19 |
+
0.647182524,4.8773,,0.375,15,0.647182524,4.8773,16.403,2.05,,,,,
|
20 |
+
0.6344,0.202345386,0.000112,0.4,16,,,,,,,,,
|
21 |
+
0.5956,0.282731414,0.000104,0.425,17,,,,,,,,,
|
22 |
+
0.6394,0.42618072,9.60E-05,0.45,18,,,,,,,,,
|
23 |
+
0.6881,0.231079757,8.80E-05,0.475,19,,,,,,,,,
|
24 |
+
0.5356,0.179146141,8.00E-05,0.5,20,,,,,,,,,
|
25 |
+
0.589806378,4.8632,,0.5,20,0.589806378,4.8632,16.45,2.056,,,,,
|
26 |
+
0.5028,0.184228301,7.20E-05,0.525,21,,,,,,,,,
|
27 |
+
0.4696,0.170585647,6.40E-05,0.55,22,,,,,,,,,
|
28 |
+
0.6429,0.298062533,5.60E-05,0.575,23,,,,,,,,,
|
29 |
+
0.5543,0.244517237,4.80E-05,0.6,24,,,,,,,,,
|
30 |
+
0.492,0.387174577,4.00E-05,0.625,25,,,,,,,,,
|
31 |
+
0.555610478,4.8657,,0.625,25,0.555610478,4.8657,16.442,2.055,,,,,
|
32 |
+
0.4687,0.348973632,3.20E-05,0.65,26,,,,,,,,,
|
33 |
+
0.5499,0.183923692,2.40E-05,0.675,27,,,,,,,,,
|
34 |
+
0.479,0.21796149,1.60E-05,0.7,28,,,,,,,,,
|
35 |
+
0.5323,0.287896246,8.00E-06,0.725,29,,,,,,,,,
|
36 |
+
0.5485,0.228732839,0,0.75,30,,,,,,,,,
|
37 |
+
,,,0.75,30,0.542289913,4.8679,16.434,2.054,,,,,
|
38 |
+
,,,0.75,30,,,,,116.3306,2.063,0.258,2.81939E+15,0.758431028
|