vikash-walmart committed on
Commit
74d056b
1 Parent(s): e4cdec7

Training in progress, step 260

Browse files
adapter_config.json CHANGED
@@ -8,28 +8,34 @@
8
  "bias": "none",
9
  "fan_in_fan_out": false,
10
  "inference_mode": true,
11
- "init_lora_weights": "gaussian",
12
  "layer_replication": null,
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
- "lora_alpha": 8,
17
- "lora_dropout": 0.1,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
  "modules_to_save": null,
21
  "peft_type": "LORA",
22
- "r": 8,
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "o_proj",
27
  "down_proj",
 
28
  "gate_proj",
29
  "up_proj",
30
- "k_proj",
 
 
 
31
  "q_proj",
32
- "v_proj"
 
 
 
33
  ],
34
  "task_type": null,
35
  "use_dora": false,
 
8
  "bias": "none",
9
  "fan_in_fan_out": false,
10
  "inference_mode": true,
11
+ "init_lora_weights": true,
12
  "layer_replication": null,
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
+ "lora_alpha": 16,
17
+ "lora_dropout": 0.0,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
  "modules_to_save": null,
21
  "peft_type": "LORA",
22
+ "r": 64,
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
26
  "down_proj",
27
+ "k_proj",
28
  "gate_proj",
29
  "up_proj",
30
+ "lm_head",
31
+ "fc1",
32
+ "out_proj",
33
+ "fc2",
34
  "q_proj",
35
+ "linear_1",
36
+ "linear_2",
37
+ "v_proj",
38
+ "o_proj"
39
  ],
40
  "task_type": null,
41
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2dd5babf6d24d0ca2ca40fa5c22a8e16fd033a11f57a04b89dd70606f8d3148
3
- size 86573968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4224dab146b0767daed913a68f976fe1805d35de6dc6fd90ceb735b27868bab
3
+ size 3003823256
runs/Oct17_13-18-37_instance-20241013-151046-finetune/events.out.tfevents.1729171121.instance-20241013-151046-finetune.2259592.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edbec5dd2e336f59af675634c9426561a797982a9724bf71274d43d839557d4e
3
+ size 18961
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3096d08840d5e028094f2f6f7ce798598eacb3ff42f6a5a30c1ef0e17b225a9
3
+ size 5560