Commit
·
5911cb4
1
Parent(s):
b8acf0a
Upload 12 files
Browse files
- AIRA_FineTuning.ipynb +0 -0
- Aira_emissions.csv +1 -1
- README.md +8 -8
- config.json +1 -1
- generation_config.json +1 -1
- pytorch_model.bin +1 -1
- training_stats.parquet +2 -2
AIRA_FineTuning.ipynb
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
Aira_emissions.csv
CHANGED
@@ -1,2 +1,2 @@
|
|
1 |
timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
|
2 |
-
2023-06-
|
|
|
1 |
timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
|
2 |
+
2023-06-26T20:59:10,Aira_emissions,11cacca9-3eab-40c7-b5f7-ddc76c5e63dd,3700.934177160263,0.19347784083149752,5.227810913944803e-05,42.5,300.033,31.30528450012207,0.043691478491657325,0.35160399291778927,0.03216577530459102,0.42746124671403773,United States,USA,iowa,,,Linux-5.15.107+-x86_64-with-glibc2.31,3.10.12,2.2.4,12,Intel(R) Xeon(R) CPU @ 2.20GHz,1,1 x NVIDIA A100-SXM4-40GB,-95.8517,41.2591,83.48075866699219,machine,N,1.0
|
README.md
CHANGED
@@ -46,23 +46,23 @@ Check our gradio-demo in [Spaces](https://huggingface.co/spaces/nicholasKluge/Ai
|
|
46 |
|
47 |
## Details
|
48 |
|
49 |
-
- **Size:** 124,441,344
|
50 |
- **Dataset:** [Instruct-Aira Dataset](https://huggingface.co/datasets/nicholasKluge/fine-tuning-instruct-aira)
|
51 |
- **Language:** English
|
52 |
- **Number of Epochs:** 5
|
53 |
- **Batch size:** 32
|
54 |
- **Optimizer:** `torch.optim.AdamW` (warmup_steps = 1e2, learning_rate = 5e-4, epsilon = 1e-8)
|
55 |
- **GPU:** 1 NVIDIA A100-SXM4-40GB
|
56 |
-
- **Emissions:** 0.
|
57 |
-
- **Total Energy Consumption:** 0.
|
58 |
|
59 |
| Epoch|Training Loss|Validation Loss|
|
60 |
|---|---|---|
|
61 |
-
| 1 |1.
|
62 |
-
| 2 |0.
|
63 |
-
| 3 |0.
|
64 |
-
| 4 |0.
|
65 |
-
| 5 |0.
|
66 |
|
67 |
This repository has the notebook used to train this model.
|
68 |
|
|
|
46 |
|
47 |
## Details
|
48 |
|
49 |
+
- **Size:** 124,441,344 parameters
|
50 |
- **Dataset:** [Instruct-Aira Dataset](https://huggingface.co/datasets/nicholasKluge/fine-tuning-instruct-aira)
|
51 |
- **Language:** English
|
52 |
- **Number of Epochs:** 5
|
53 |
- **Batch size:** 32
|
54 |
- **Optimizer:** `torch.optim.AdamW` (warmup_steps = 1e2, learning_rate = 5e-4, epsilon = 1e-8)
|
55 |
- **GPU:** 1 NVIDIA A100-SXM4-40GB
|
56 |
+
- **Emissions:** 0.19 kg CO2 (United States of America)
|
57 |
+
- **Total Energy Consumption:** 0.43 kWh
|
58 |
|
59 |
| Epoch|Training Loss|Validation Loss|
|
60 |
|---|---|---|
|
61 |
+
| 1 |1.076073|0.692127|
|
62 |
+
| 2 |0.680394|0.662053|
|
63 |
+
| 3 |0.622054|0.651161|
|
64 |
+
| 4 |0.577170|0.644864|
|
65 |
+
| 5 |0.541509|0.644677|
|
66 |
|
67 |
This repository has the notebook used to train this model.
|
68 |
|
config.json
CHANGED
@@ -33,7 +33,7 @@
|
|
33 |
}
|
34 |
},
|
35 |
"torch_dtype": "float32",
|
36 |
-
"transformers_version": "4.30.
|
37 |
"use_cache": true,
|
38 |
"vocab_size": 50259
|
39 |
}
|
|
|
33 |
}
|
34 |
},
|
35 |
"torch_dtype": "float32",
|
36 |
+
"transformers_version": "4.30.2",
|
37 |
"use_cache": true,
|
38 |
"vocab_size": 50259
|
39 |
}
|
generation_config.json
CHANGED
@@ -2,5 +2,5 @@
|
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 50256,
|
4 |
"eos_token_id": 50256,
|
5 |
-
"transformers_version": "4.30.
|
6 |
}
|
|
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 50256,
|
4 |
"eos_token_id": 50256,
|
5 |
+
"transformers_version": "4.30.2"
|
6 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 497813341
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:416747d3d9f13edd608e3bfb88cea796290ae21c9b9e293d8de518c8c18417af
|
3 |
size 497813341
|
training_stats.parquet
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27e940ad317c8e9f7d3eb1a1f223abef0d2ada8f5c0727d89d66121b856c6841
|
3 |
+
size 3110
|