HecklesL committed on
Commit
772f226
·
verified ·
1 Parent(s): fdbfbd3

Commit message

Browse files
Files changed (19) hide show
  1. README.md +2 -6
  2. adapter_config.json +2 -2
  3. adapter_model.safetensors +1 -1
  4. runs/Nov09_09-17-24_ip-10-192-12-219/events.out.tfevents.1731143845.ip-10-192-12-219.117549.0 +3 -0
  5. runs/Nov09_09-26-40_ip-10-192-12-219/events.out.tfevents.1731144401.ip-10-192-12-219.117549.1 +3 -0
  6. runs/Nov09_09-29-40_ip-10-192-12-219/events.out.tfevents.1731144580.ip-10-192-12-219.117549.2 +3 -0
  7. runs/Nov09_09-56-07_ip-10-192-12-219/events.out.tfevents.1731146169.ip-10-192-12-219.181121.0 +3 -0
  8. runs/Nov09_09-59-21_ip-10-192-12-219/events.out.tfevents.1731146362.ip-10-192-12-219.181121.1 +3 -0
  9. runs/Nov09_10-01-40_ip-10-192-12-219/events.out.tfevents.1731146501.ip-10-192-12-219.181121.2 +3 -0
  10. runs/Nov09_10-04-49_ip-10-192-12-219/events.out.tfevents.1731146690.ip-10-192-12-219.181121.3 +3 -0
  11. runs/Nov09_12-49-26_ip-10-192-11-134/events.out.tfevents.1731156569.ip-10-192-11-134.1666.0 +3 -0
  12. runs/Nov09_13-00-15_ip-10-192-11-134/events.out.tfevents.1731157217.ip-10-192-11-134.15162.0 +3 -0
  13. runs/Nov09_13-16-26_ip-10-192-11-134/events.out.tfevents.1731158189.ip-10-192-11-134.36325.0 +3 -0
  14. runs/Nov09_13-27-17_ip-10-192-11-134/events.out.tfevents.1731158839.ip-10-192-11-134.50779.0 +3 -0
  15. runs/Nov09_13-32-54_ip-10-192-11-134/events.out.tfevents.1731159177.ip-10-192-11-134.58325.0 +3 -0
  16. runs/Nov09_13-34-32_ip-10-192-11-134/events.out.tfevents.1731159274.ip-10-192-11-134.60568.0 +3 -0
  17. runs/Nov09_13-36-14_ip-10-192-11-134/events.out.tfevents.1731159377.ip-10-192-11-134.62817.0 +3 -0
  18. tokenizer.json +2 -2
  19. training_args.bin +2 -2
README.md CHANGED
@@ -41,19 +41,15 @@ The following hyperparameters were used during training:
41
  - seed: 42
42
  - gradient_accumulation_steps: 8
43
  - total_train_batch_size: 32
44
- - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
  - lr_scheduler_type: constant
46
  - lr_scheduler_warmup_ratio: 0.03
47
  - num_epochs: 3
48
 
49
- ### Training results
50
-
51
-
52
-
53
  ### Framework versions
54
 
55
  - PEFT 0.13.0
56
- - Transformers 4.45.1
57
  - Pytorch 2.4.0+cu121
58
  - Datasets 3.0.1
59
  - Tokenizers 0.20.1
 
41
  - seed: 42
42
  - gradient_accumulation_steps: 8
43
  - total_train_batch_size: 32
44
+ - optimizer: Use adamw_torch_fused with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
45
  - lr_scheduler_type: constant
46
  - lr_scheduler_warmup_ratio: 0.03
47
  - num_epochs: 3
48
 
 
 
 
 
49
  ### Framework versions
50
 
51
  - PEFT 0.13.0
52
+ - Transformers 4.46.2
53
  - Pytorch 2.4.0+cu121
54
  - Datasets 3.0.1
55
  - Tokenizers 0.20.1
adapter_config.json CHANGED
@@ -20,8 +20,8 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "q_proj",
24
- "v_proj"
25
  ],
26
  "task_type": "CAUSAL_LM",
27
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "v_proj",
24
+ "q_proj"
25
  ],
26
  "task_type": "CAUSAL_LM",
27
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8741ff58e846384e51fa9a378a18de184c89521547b1d0caab85522ae3289bfb
3
  size 23641256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d5c3fc263a5012355bc2a1c8e2701cbb93dbf7083de71e55f1cbd7f29349b46
3
  size 23641256
runs/Nov09_09-17-24_ip-10-192-12-219/events.out.tfevents.1731143845.ip-10-192-12-219.117549.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:623ae07bc0481d0d566fad78bdb85f89bc42948fcb7460fd1b8c907c21dd70d1
3
+ size 10346
runs/Nov09_09-26-40_ip-10-192-12-219/events.out.tfevents.1731144401.ip-10-192-12-219.117549.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57e50aa9bd50678162a4e3efa86de578ff330fdb18b4f9dd9846d13ca9fde254
3
+ size 6046
runs/Nov09_09-29-40_ip-10-192-12-219/events.out.tfevents.1731144580.ip-10-192-12-219.117549.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bec367eeb00b1a84f7139acc9a73bd0324483a88bc34848cce74955b8a2c820
3
+ size 6046
runs/Nov09_09-56-07_ip-10-192-12-219/events.out.tfevents.1731146169.ip-10-192-12-219.181121.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbc7ab9ccdd50f53b3053c32ba272e3baa94e961db378bc19bd41099f22eec53
3
+ size 6047
runs/Nov09_09-59-21_ip-10-192-12-219/events.out.tfevents.1731146362.ip-10-192-12-219.181121.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ae452ac0c6c21dd29a2183b64a2cd9cf334079ba921a68518530053962a012b
3
+ size 6047
runs/Nov09_10-01-40_ip-10-192-12-219/events.out.tfevents.1731146501.ip-10-192-12-219.181121.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:deba96ae93b77219b83597011f3ab8b0ee6d44e80985d59e8d0f2e41e120f8d9
3
+ size 6047
runs/Nov09_10-04-49_ip-10-192-12-219/events.out.tfevents.1731146690.ip-10-192-12-219.181121.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6018e412e2b46bfaaaf1017051231af23e88c08f011979f969ffa9d184839900
3
+ size 6047
runs/Nov09_12-49-26_ip-10-192-11-134/events.out.tfevents.1731156569.ip-10-192-11-134.1666.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd64045a4e9b750c2ffc4e49632d0700f13c8d6f909c1e48665945b52b50c381
3
+ size 6047
runs/Nov09_13-00-15_ip-10-192-11-134/events.out.tfevents.1731157217.ip-10-192-11-134.15162.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df5db4cfc1f979f5463c818909ad141658bf0fde38503dae5191a7af8d593f24
3
+ size 10346
runs/Nov09_13-16-26_ip-10-192-11-134/events.out.tfevents.1731158189.ip-10-192-11-134.36325.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efd8e9d1ad9a023ba2dc44044c39f6b014ff939b9329bfdac94eb4a776b1496b
3
+ size 10543
runs/Nov09_13-27-17_ip-10-192-11-134/events.out.tfevents.1731158839.ip-10-192-11-134.50779.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:605bcf0f0466eb447092069065157b48f6e140ea12fff242547ba8f83cf6739e
3
+ size 10062
runs/Nov09_13-32-54_ip-10-192-11-134/events.out.tfevents.1731159177.ip-10-192-11-134.58325.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6374e83a43530f7bfb579e56b4ee8473a128d3e488765cab5a259c4063da414a
3
+ size 10062
runs/Nov09_13-34-32_ip-10-192-11-134/events.out.tfevents.1731159274.ip-10-192-11-134.60568.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdd2a5029f533d57e1fc3e32ba86ccfb5df60a1217c7a146ac6cdd1563169b93
3
+ size 10062
runs/Nov09_13-36-14_ip-10-192-11-134/events.out.tfevents.1731159377.ip-10-192-11-134.62817.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5781f84c5643d81e5d765b51dd151a9bc257922d754df75bf26d035cceb15748
3
+ size 10062
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:abd08b46c9c01a903788030f36d9731aad064d0c420e66b88e3e143cda9e4e9a
3
- size 17210268
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9816d43bd5347d64bccc66b7710947fb18e9818cc660215b1462061d4a44e449
3
+ size 17210088
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df12c48bb2cf17b1a8f19883545328ab580e1d7555de74620e2ec44f4949fea9
3
- size 5560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:540974c06f0e6342b8a99442a23bb28a0c06f97ca9b94c689f0aa0dc07fcda2f
3
+ size 5624