lvcalucioli committed on
Commit
170f3a2
1 Parent(s): d50a6f5

llamantino7b_2_2_syntetic-question-answering

Browse files
README.md CHANGED
@@ -42,7 +42,7 @@ The following hyperparameters were used during training:
42
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
43
  - lr_scheduler_type: cosine
44
  - lr_scheduler_warmup_ratio: 0.03
45
- - num_epochs: 2
46
 
47
  ### Training results
48
 
 
42
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
43
  - lr_scheduler_type: cosine
44
  - lr_scheduler_warmup_ratio: 0.03
45
+ - num_epochs: 3
46
 
47
  ### Training results
48
 
adapter_config.json CHANGED
@@ -19,13 +19,13 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "gate_proj",
23
- "down_proj",
 
24
  "k_proj",
25
  "o_proj",
26
- "q_proj",
27
- "up_proj",
28
- "v_proj"
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "use_rslora": false
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
+ "up_proj",
23
+ "q_proj",
24
+ "v_proj",
25
  "k_proj",
26
  "o_proj",
27
+ "down_proj",
28
+ "gate_proj"
 
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "use_rslora": false
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04a240d7b26be23b1810b6315b9fc0fe08cbe5e46b9eccd91284cdf505dab4b9
3
  size 639691872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9e091b11a047bc51d4d5608cde70f9359235138295222d4baa7b9a388dcd572
3
  size 639691872
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4fcab6936f2b02d715e388fcca1a5f1f66396e4ea6e8b22d1df81fc3ac6e62b5
3
  size 4411
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca2d84401ff09ae7196e4302d101b091763affdff18a759d3d22d09d7b087f3e
3
  size 4411