Model save

Files changed (8) hide show

README.md CHANGED Viewed

@@ -38,6 +38,8 @@ The following hyperparameters were used during training:
 - eval_batch_size: 8
 - seed: 42
 - distributed_type: multi-GPU
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - num_epochs: 1

 - eval_batch_size: 8
 - seed: 42
 - distributed_type: multi-GPU
+- gradient_accumulation_steps: 128
+- total_train_batch_size: 512
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - num_epochs: 1

adapter_config.json CHANGED Viewed

@@ -17,8 +17,8 @@
   "revision": null,
   "target_modules": [
     "k_proj",
-    "q_proj",
     "o_proj",
     "v_proj"
   ],
   "task_type": "CAUSAL_LM"

   "revision": null,
   "target_modules": [
     "k_proj",
     "o_proj",
+    "q_proj",
     "v_proj"
   ],
   "task_type": "CAUSAL_LM"

runs/Feb01_05-47-09_r2d2-devbox-wmqsn/events.out.tfevents.1738388846.r2d2-devbox-wmqsn.24987.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:da26d08905c5c0f05bd0ef71055bcf815cd07a5cea9ab0ea1a3b3970c0383430
-size 4610

 version https://git-lfs.github.com/spec/v1
+oid sha256:d4afdab79fd69207f993dfcf392282861b9515a6b4362497c8ccaf42dc04cfba
+size 4764

runs/Feb01_05-54-49_r2d2-devbox-wmqsn/events.out.tfevents.1738389306.r2d2-devbox-wmqsn.27083.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e772613f767b5658dc13767309acbba14b874a99486e10574b7723636ae51375
+size 4612

step_0/README.md CHANGED Viewed

@@ -252,4 +252,11 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
 ### Framework versions
 - PEFT 0.6.1

 ### Framework versions
+- PEFT 0.6.1
+## Training procedure
+### Framework versions
 - PEFT 0.6.1

step_0/adapter_config.json CHANGED Viewed

@@ -17,8 +17,8 @@
   "revision": null,
   "target_modules": [
     "k_proj",
-    "q_proj",
     "o_proj",
     "v_proj"
   ],
   "task_type": "CAUSAL_LM"

   "revision": null,
   "target_modules": [
     "k_proj",
     "o_proj",
+    "q_proj",
     "v_proj"
   ],
   "task_type": "CAUSAL_LM"

step_0/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3f678c0eb7dbf508bb36eb2b09042f14e1f332a508923b35c640d3063d3a980a
 size 5816

 version https://git-lfs.github.com/spec/v1
+oid sha256:474709a6006c3092e509b34915c981e6f121c05a99366513abb5f1339867c2c0
 size 5816

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3f678c0eb7dbf508bb36eb2b09042f14e1f332a508923b35c640d3063d3a980a
 size 5816

 version https://git-lfs.github.com/spec/v1
+oid sha256:474709a6006c3092e509b34915c981e6f121c05a99366513abb5f1339867c2c0
 size 5816