tomtseng committed on
Commit
280e720
·
verified ·
1 Parent(s): 86870d9

Model save

Browse files
README.md CHANGED
@@ -38,6 +38,8 @@ The following hyperparameters were used during training:
38
  - eval_batch_size: 8
39
  - seed: 42
40
  - distributed_type: multi-GPU
 
 
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: cosine
43
  - num_epochs: 1
 
38
  - eval_batch_size: 8
39
  - seed: 42
40
  - distributed_type: multi-GPU
41
+ - gradient_accumulation_steps: 128
42
+ - total_train_batch_size: 512
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: cosine
45
  - num_epochs: 1
adapter_config.json CHANGED
@@ -17,8 +17,8 @@
17
  "revision": null,
18
  "target_modules": [
19
  "k_proj",
20
- "q_proj",
21
  "o_proj",
 
22
  "v_proj"
23
  ],
24
  "task_type": "CAUSAL_LM"
 
17
  "revision": null,
18
  "target_modules": [
19
  "k_proj",
 
20
  "o_proj",
21
+ "q_proj",
22
  "v_proj"
23
  ],
24
  "task_type": "CAUSAL_LM"
runs/Feb01_05-47-09_r2d2-devbox-wmqsn/events.out.tfevents.1738388846.r2d2-devbox-wmqsn.24987.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da26d08905c5c0f05bd0ef71055bcf815cd07a5cea9ab0ea1a3b3970c0383430
3
- size 4610
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4afdab79fd69207f993dfcf392282861b9515a6b4362497c8ccaf42dc04cfba
3
+ size 4764
runs/Feb01_05-54-49_r2d2-devbox-wmqsn/events.out.tfevents.1738389306.r2d2-devbox-wmqsn.27083.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e772613f767b5658dc13767309acbba14b874a99486e10574b7723636ae51375
3
+ size 4612
step_0/README.md CHANGED
@@ -252,4 +252,11 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
252
  ### Framework versions
253
 
254
 
 
 
 
 
 
 
 
255
  - PEFT 0.6.1
 
252
  ### Framework versions
253
 
254
 
255
+ - PEFT 0.6.1
256
+ ## Training procedure
257
+
258
+
259
+ ### Framework versions
260
+
261
+
262
  - PEFT 0.6.1
step_0/adapter_config.json CHANGED
@@ -17,8 +17,8 @@
17
  "revision": null,
18
  "target_modules": [
19
  "k_proj",
20
- "q_proj",
21
  "o_proj",
 
22
  "v_proj"
23
  ],
24
  "task_type": "CAUSAL_LM"
 
17
  "revision": null,
18
  "target_modules": [
19
  "k_proj",
 
20
  "o_proj",
21
+ "q_proj",
22
  "v_proj"
23
  ],
24
  "task_type": "CAUSAL_LM"
step_0/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f678c0eb7dbf508bb36eb2b09042f14e1f332a508923b35c640d3063d3a980a
3
  size 5816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:474709a6006c3092e509b34915c981e6f121c05a99366513abb5f1339867c2c0
3
  size 5816
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f678c0eb7dbf508bb36eb2b09042f14e1f332a508923b35c640d3063d3a980a
3
  size 5816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:474709a6006c3092e509b34915c981e6f121c05a99366513abb5f1339867c2c0
3
  size 5816