nicholasKluge committed on
Commit
5911cb4
·
1 Parent(s): b8acf0a

Upload 12 files

Browse files
AIRA_FineTuning.ipynb CHANGED
The diff for this file is too large to render. See raw diff
 
Aira_emissions.csv CHANGED
@@ -1,2 +1,2 @@
1
  timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
2
- 2023-06-11T00:44:09,Aira_emissions,cf6bd6e6-4983-41ba-b2a3-bea0e4ca0a1b,4011.559634208679,0.15083361627850095,3.7599744247165954e-05,42.5,343.846,31.30528450012207,0.04735859059956342,0.37325643035497413,0.034865123505880974,0.4554801444604184,Netherlands,NLD,groningen,,,Linux-5.15.107+-x86_64-with-glibc2.31,3.10.12,2.2.3,12,Intel(R) Xeon(R) CPU @ 2.20GHz,1,1 x NVIDIA A100-SXM4-40GB,6.5765,53.2157,83.48075866699219,machine,N,1.0
 
1
  timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
2
+ 2023-06-26T20:59:10,Aira_emissions,11cacca9-3eab-40c7-b5f7-ddc76c5e63dd,3700.934177160263,0.19347784083149752,5.227810913944803e-05,42.5,300.033,31.30528450012207,0.043691478491657325,0.35160399291778927,0.03216577530459102,0.42746124671403773,United States,USA,iowa,,,Linux-5.15.107+-x86_64-with-glibc2.31,3.10.12,2.2.4,12,Intel(R) Xeon(R) CPU @ 2.20GHz,1,1 x NVIDIA A100-SXM4-40GB,-95.8517,41.2591,83.48075866699219,machine,N,1.0
README.md CHANGED
@@ -46,23 +46,23 @@ Check our gradio-demo in [Spaces](https://huggingface.co/spaces/nicholasKluge/Ai
46
 
47
  ## Details
48
 
49
- - **Size:** 124,441,344 total parameters
50
  - **Dataset:** [Instruct-Aira Dataset](https://huggingface.co/datasets/nicholasKluge/fine-tuning-instruct-aira)
51
  - **Language:** English
52
  - **Number of Epochs:** 5
53
  - **Batch size:** 32
54
  - **Optimizer:** `torch.optim.AdamW` (warmup_steps = 1e2, learning_rate = 5e-4, epsilon = 1e-8)
55
  - **GPU:** 1 NVIDIA A100-SXM4-40GB
56
- - **Emissions:** 0.15 KgCO2 (Netherlands)
57
- - **Total Energy Consumption:** 0.45 kWh
58
 
59
  | Epoch|Training Loss|Validation Loss|
60
  |---|---|---|
61
- | 1 |1.052499|0.673275|
62
- | 2 |0.675395|0.642822|
63
- | 3 |0.616321|0.630550|
64
- | 4 |0.571597|0.626158|
65
- | 5 |0.534876|0.626929|
66
 
67
  This repository has the notebook used to train this model.
68
 
 
46
 
47
  ## Details
48
 
49
+ - **Size:** 124,441,344 parameters
50
  - **Dataset:** [Instruct-Aira Dataset](https://huggingface.co/datasets/nicholasKluge/fine-tuning-instruct-aira)
51
  - **Language:** English
52
  - **Number of Epochs:** 5
53
  - **Batch size:** 32
54
  - **Optimizer:** `torch.optim.AdamW` (warmup_steps = 1e2, learning_rate = 5e-4, epsilon = 1e-8)
55
  - **GPU:** 1 NVIDIA A100-SXM4-40GB
56
+ - **Emissions:** 0.19 kgCO2 (United States of America)
57
+ - **Total Energy Consumption:** 0.43 kWh
58
 
59
  | Epoch|Training Loss|Validation Loss|
60
  |---|---|---|
61
+ | 1 |1.076073|0.692127|
62
+ | 2 |0.680394|0.662053|
63
+ | 3 |0.622054|0.651161|
64
+ | 4 |0.577170|0.644864|
65
+ | 5 |0.541509|0.644677|
66
 
67
  This repository has the notebook used to train this model.
68
 
config.json CHANGED
@@ -33,7 +33,7 @@
33
  }
34
  },
35
  "torch_dtype": "float32",
36
- "transformers_version": "4.30.1",
37
  "use_cache": true,
38
  "vocab_size": 50259
39
  }
 
33
  }
34
  },
35
  "torch_dtype": "float32",
36
+ "transformers_version": "4.30.2",
37
  "use_cache": true,
38
  "vocab_size": 50259
39
  }
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 50256,
4
  "eos_token_id": 50256,
5
- "transformers_version": "4.30.1"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 50256,
4
  "eos_token_id": 50256,
5
+ "transformers_version": "4.30.2"
6
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a2f23a7600d9708d6a3069758ca7b39d82a7ce5a5dc4c345ccb3dd11cd595f4
3
  size 497813341
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:416747d3d9f13edd608e3bfb88cea796290ae21c9b9e293d8de518c8c18417af
3
  size 497813341
training_stats.parquet CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d6c3c8c2cdbfe807189e35c2da55e34d3990074e40da1306cebbff9f0edba42a
3
- size 3108
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27e940ad317c8e9f7d3eb1a1f223abef0d2ada8f5c0727d89d66121b856c6841
3
+ size 3110