Upload folder using huggingface_hub
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint-1050/adapter_model/README.md +34 -0
- checkpoint-1050/adapter_model/adapter_config.json +26 -0
- checkpoint-1050/adapter_model/adapter_model.bin +3 -0
- checkpoint-1125/adapter_model/README.md +50 -0
- checkpoint-1125/adapter_model/adapter_config.json +26 -0
- checkpoint-1125/adapter_model/adapter_model.bin +3 -0
- checkpoint-1200/adapter_model/README.md +47 -0
- checkpoint-1200/adapter_model/adapter_config.json +26 -0
- checkpoint-1200/adapter_model/adapter_model.bin +3 -0
- checkpoint-1275/adapter_model/README.md +34 -0
- checkpoint-1275/adapter_model/adapter_config.json +26 -0
- checkpoint-1275/adapter_model/adapter_model.bin +3 -0
- checkpoint-1350/adapter_model/README.md +47 -0
- checkpoint-1350/adapter_model/adapter_config.json +26 -0
- checkpoint-1350/adapter_model/adapter_model.bin +3 -0
- checkpoint-1353/adapter_model/README.md +22 -0
- checkpoint-1353/adapter_model/adapter_config.json +26 -0
- checkpoint-1353/adapter_model/adapter_model.bin +3 -0
- checkpoint-225/adapter_model/README.md +47 -0
- checkpoint-225/adapter_model/adapter_config.json +26 -0
- checkpoint-225/adapter_model/adapter_model.bin +3 -0
- checkpoint-300/adapter_model/README.md +50 -0
- checkpoint-300/adapter_model/adapter_config.json +26 -0
- checkpoint-300/adapter_model/adapter_model.bin +3 -0
- checkpoint-375/adapter_model/README.md +50 -0
- checkpoint-375/adapter_model/adapter_config.json +26 -0
- checkpoint-375/adapter_model/adapter_model.bin +3 -0
- checkpoint-450/adapter_model/README.md +34 -0
- checkpoint-450/adapter_model/adapter_config.json +26 -0
- checkpoint-450/adapter_model/adapter_model.bin +3 -0
- checkpoint-525/adapter_model/README.md +51 -0
- checkpoint-525/adapter_model/adapter_config.json +26 -0
- checkpoint-525/adapter_model/adapter_model.bin +3 -0
- checkpoint-600/adapter_model/README.md +47 -0
- checkpoint-600/adapter_model/adapter_config.json +26 -0
- checkpoint-600/adapter_model/adapter_model.bin +3 -0
- checkpoint-675/adapter_model/README.md +0 -0
- checkpoint-675/adapter_model/adapter_config.json +26 -0
- checkpoint-675/adapter_model/adapter_model.bin +3 -0
- checkpoint-750/adapter_model/README.md +47 -0
- checkpoint-750/adapter_model/adapter_config.json +26 -0
- checkpoint-750/adapter_model/adapter_model.bin +3 -0
- checkpoint-825/adapter_model/README.md +34 -0
- checkpoint-825/adapter_model/adapter_config.json +26 -0
- checkpoint-825/adapter_model/adapter_model.bin +3 -0
- checkpoint-900/adapter_model/README.md +50 -0
- checkpoint-900/adapter_model/adapter_config.json +26 -0
- checkpoint-900/adapter_model/adapter_model.bin +3 -0
- checkpoint-975/adapter_model/README.md +50 -0
- checkpoint-975/adapter_model/adapter_config.json +26 -0
checkpoint-1050/adapter_model/README.md
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
### Framework versions
|
31 |
+
|
32 |
+
- PEFT 0.4.0
|
33 |
+
|
34 |
+
- PEFT 0.4.0
|
checkpoint-1050/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-1050/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e215a0530e59323730c42bf159ebde34d82f9124371a99938fd7349c7473ad3
|
3 |
+
size 1742976394
|
checkpoint-1125/adapter_model/README.md
ADDED
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
### Framework versions
|
31 |
+
|
32 |
+
- PEFT 0.4.0
|
33 |
+
|
34 |
+
- PEFT 0.4.0
|
35 |
+
The following `bitsandbytes` quantization config was used during training:
|
36 |
+
- quant_method: bitsandbytes
|
37 |
+
- load_in_8bit: False
|
38 |
+
- load_in_4bit: True
|
39 |
+
- llm_int8_threshold: 6.0
|
40 |
+
- llm_int8_skip_modules: None
|
41 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
42 |
+
- llm_int8_has_fp16_weight: False
|
43 |
+
- bnb_4bit_quant_type: nf4
|
44 |
+
- bnb_4bit_use_double_quant: True
|
45 |
+
- bnb_4bit_compute_dtype: bfloat16
|
46 |
+
### Framework versions
|
47 |
+
|
48 |
+
- PEFT 0.4.0
|
49 |
+
|
50 |
+
- PEFT 0.4.0
|
checkpoint-1125/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-1125/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a4d4bac811251a6c6ed61c30aa4802b88ca7dd50f831ecf6fc2e7ceeee1297c
|
3 |
+
size 1742976394
|
checkpoint-1200/adapter_model/README.md
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
|
31 |
+
The following `bitsandbytes` quantization config was used during training:
|
32 |
+
- quant_method: bitsandbytes
|
33 |
+
- load_in_8bit: False
|
34 |
+
- load_in_4bit: True
|
35 |
+
- llm_int8_threshold: 6.0
|
36 |
+
- llm_int8_skip_modules: None
|
37 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
38 |
+
- llm_int8_has_fp16_weight: False
|
39 |
+
- bnb_4bit_quant_type: nf4
|
40 |
+
- bnb_4bit_use_double_quant: True
|
41 |
+
- bnb_4bit_compute_dtype: bfloat16
|
42 |
+
### Framework versions
|
43 |
+
|
44 |
+
- PEFT 0.4.0
|
45 |
+
- PEFT 0.4.0
|
46 |
+
|
47 |
+
- PEFT 0.4.0
|
checkpoint-1200/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-1200/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7d5aa554ab1cb5115e63f6be3c5d7a41de170c336ed2e280fdbd713694c602c
|
3 |
+
size 1742976394
|
checkpoint-1275/adapter_model/README.md
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
### Framework versions
|
31 |
+
|
32 |
+
- PEFT 0.4.0
|
33 |
+
|
34 |
+
- PEFT 0.4.0
|
checkpoint-1275/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-1275/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fb6bcb2789dcaf7ee7a0941964b94061afe631dbaf4665feb5bd52dfad58018
|
3 |
+
size 1742976394
|
checkpoint-1350/adapter_model/README.md
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
|
31 |
+
The following `bitsandbytes` quantization config was used during training:
|
32 |
+
- quant_method: bitsandbytes
|
33 |
+
- load_in_8bit: False
|
34 |
+
- load_in_4bit: True
|
35 |
+
- llm_int8_threshold: 6.0
|
36 |
+
- llm_int8_skip_modules: None
|
37 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
38 |
+
- llm_int8_has_fp16_weight: False
|
39 |
+
- bnb_4bit_quant_type: nf4
|
40 |
+
- bnb_4bit_use_double_quant: True
|
41 |
+
- bnb_4bit_compute_dtype: bfloat16
|
42 |
+
### Framework versions
|
43 |
+
|
44 |
+
- PEFT 0.4.0
|
45 |
+
- PEFT 0.4.0
|
46 |
+
|
47 |
+
- PEFT 0.4.0
|
checkpoint-1350/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-1350/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:814d998d72074a5f71765d9031d68d1e3f46efa90589332414e74442f86901bb
|
3 |
+
size 1742976394
|
checkpoint-1353/adapter_model/README.md
ADDED
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
## Training procedure
|
2 |
+
|
3 |
+
|
4 |
+
The following `bitsandbytes` quantization config was used during training:
|
5 |
+
- quant_method: bitsandbytes
|
6 |
+
- load_in_8bit: False
|
7 |
+
- load_in_4bit: True
|
8 |
+
- llm_int8_threshold: 6.0
|
9 |
+
- llm_int8_skip_modules: None
|
10 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
11 |
+
- llm_int8_has_fp16_weight: False
|
12 |
+
- bnb_4bit_quant_type: nf4
|
13 |
+
- bnb_4bit_use_double_quant: True
|
14 |
+
- bnb_4bit_compute_dtype: bfloat16
|
15 |
+
### Framework versions
|
16 |
+
|
17 |
+
|
18 |
+
- PEFT 0.4.0
|
19 |
+
### Framework versions
|
20 |
+
|
21 |
+
|
22 |
+
- PEFT 0.4.0
|
checkpoint-1353/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"up_proj",
|
18 |
+
"gate_proj",
|
19 |
+
"v_proj",
|
20 |
+
"q_proj",
|
21 |
+
"down_proj",
|
22 |
+
"o_proj",
|
23 |
+
"k_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-1353/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bca5447a82f25ecc557959787df52f2ac0ffa74c2ee5097065ca392ff8be3b17
|
3 |
+
size 1742976394
|
checkpoint-225/adapter_model/README.md
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
|
31 |
+
The following `bitsandbytes` quantization config was used during training:
|
32 |
+
- quant_method: bitsandbytes
|
33 |
+
- load_in_8bit: False
|
34 |
+
- load_in_4bit: True
|
35 |
+
- llm_int8_threshold: 6.0
|
36 |
+
- llm_int8_skip_modules: None
|
37 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
38 |
+
- llm_int8_has_fp16_weight: False
|
39 |
+
- bnb_4bit_quant_type: nf4
|
40 |
+
- bnb_4bit_use_double_quant: True
|
41 |
+
- bnb_4bit_compute_dtype: bfloat16
|
42 |
+
### Framework versions
|
43 |
+
|
44 |
+
- PEFT 0.4.0
|
45 |
+
- PEFT 0.4.0
|
46 |
+
|
47 |
+
- PEFT 0.4.0
|
checkpoint-225/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-225/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58bfd15c54cd3b129aa0a9713853da70e9f8e7db78b5993a0b181f3f9b1e4ef9
|
3 |
+
size 1742976394
|
checkpoint-300/adapter_model/README.md
ADDED
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
### Framework versions
|
31 |
+
|
32 |
+
- PEFT 0.4.0
|
33 |
+
|
34 |
+
- PEFT 0.4.0
|
35 |
+
The following `bitsandbytes` quantization config was used during training:
|
36 |
+
- quant_method: bitsandbytes
|
37 |
+
- load_in_8bit: False
|
38 |
+
- load_in_4bit: True
|
39 |
+
- llm_int8_threshold: 6.0
|
40 |
+
- llm_int8_skip_modules: None
|
41 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
42 |
+
- llm_int8_has_fp16_weight: False
|
43 |
+
- bnb_4bit_quant_type: nf4
|
44 |
+
- bnb_4bit_use_double_quant: True
|
45 |
+
- bnb_4bit_compute_dtype: bfloat16
|
46 |
+
### Framework versions
|
47 |
+
|
48 |
+
- PEFT 0.4.0
|
49 |
+
|
50 |
+
- PEFT 0.4.0
|
checkpoint-300/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-300/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b12b8826464636147fcd84a41896630ebed25c69fc9ad75549e99b868c0a37b
|
3 |
+
size 1742976394
|
checkpoint-375/adapter_model/README.md
ADDED
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
### Framework versions
|
31 |
+
|
32 |
+
- PEFT 0.4.0
|
33 |
+
|
34 |
+
- PEFT 0.4.0
|
35 |
+
The following `bitsandbytes` quantization config was used during training:
|
36 |
+
- quant_method: bitsandbytes
|
37 |
+
- load_in_8bit: False
|
38 |
+
- load_in_4bit: True
|
39 |
+
- llm_int8_threshold: 6.0
|
40 |
+
- llm_int8_skip_modules: None
|
41 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
42 |
+
- llm_int8_has_fp16_weight: False
|
43 |
+
- bnb_4bit_quant_type: nf4
|
44 |
+
- bnb_4bit_use_double_quant: True
|
45 |
+
- bnb_4bit_compute_dtype: bfloat16
|
46 |
+
### Framework versions
|
47 |
+
|
48 |
+
- PEFT 0.4.0
|
49 |
+
|
50 |
+
- PEFT 0.4.0
|
checkpoint-375/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-375/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2de322e76acd96d6ec5d4cf90230ec24d897a39a1d8b968245f3c17ffb1f1d56
|
3 |
+
size 1742976394
|
checkpoint-450/adapter_model/README.md
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
### Framework versions
|
31 |
+
|
32 |
+
- PEFT 0.4.0
|
33 |
+
|
34 |
+
- PEFT 0.4.0
|
checkpoint-450/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-450/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc6c85a3ef343c9f388e4f65c8a1c2fd88414e1f0f242ff487b715f6dac88375
|
3 |
+
size 1742976394
|
checkpoint-525/adapter_model/README.md
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
|
31 |
+
The following `bitsandbytes` quantization config was used during training:
|
32 |
+
- quant_method: bitsandbytes
|
33 |
+
- load_in_8bit: False
|
34 |
+
- load_in_4bit: True
|
35 |
+
- llm_int8_threshold: 6.0
|
36 |
+
- llm_int8_skip_modules: None
|
37 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
38 |
+
- llm_int8_has_fp16_weight: False
|
39 |
+
- bnb_4bit_quant_type: nf4
|
40 |
+
- bnb_4bit_use_double_quant: True
|
41 |
+
- bnb_4bit_compute_dtype: bfloat16
|
42 |
+
### Framework versions
|
43 |
+
|
44 |
+
- PEFT 0.4.0
|
45 |
+
- PEFT 0.4.0
|
46 |
+
|
47 |
+
- PEFT 0.4.0
|
48 |
+
### Framework versions
|
49 |
+
|
50 |
+
|
51 |
+
- PEFT 0.4.0
|
checkpoint-525/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-525/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44c770157f5696e256cea6286ed23173cd91fd4eb632456d26bbacb49e9a1564
|
3 |
+
size 1742976394
|
checkpoint-600/adapter_model/README.md
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
|
31 |
+
The following `bitsandbytes` quantization config was used during training:
|
32 |
+
- quant_method: bitsandbytes
|
33 |
+
- load_in_8bit: False
|
34 |
+
- load_in_4bit: True
|
35 |
+
- llm_int8_threshold: 6.0
|
36 |
+
- llm_int8_skip_modules: None
|
37 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
38 |
+
- llm_int8_has_fp16_weight: False
|
39 |
+
- bnb_4bit_quant_type: nf4
|
40 |
+
- bnb_4bit_use_double_quant: True
|
41 |
+
- bnb_4bit_compute_dtype: bfloat16
|
42 |
+
### Framework versions
|
43 |
+
|
44 |
+
- PEFT 0.4.0
|
45 |
+
- PEFT 0.4.0
|
46 |
+
|
47 |
+
- PEFT 0.4.0
|
checkpoint-600/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-600/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e9d314bbec2de58c8dee041c9f49dd68ee46e466639f37c587e3ea319066a3f
|
3 |
+
size 1742976394
|
checkpoint-675/adapter_model/README.md
ADDED
Binary file (1.34 kB). View file
|
|
checkpoint-675/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-675/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1bede31f7fc266f4b61fe4efb7ffc881a1a966a922b2d1535d6958932d68858
|
3 |
+
size 1742976394
|
checkpoint-750/adapter_model/README.md
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
|
31 |
+
The following `bitsandbytes` quantization config was used during training:
|
32 |
+
- quant_method: bitsandbytes
|
33 |
+
- load_in_8bit: False
|
34 |
+
- load_in_4bit: True
|
35 |
+
- llm_int8_threshold: 6.0
|
36 |
+
- llm_int8_skip_modules: None
|
37 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
38 |
+
- llm_int8_has_fp16_weight: False
|
39 |
+
- bnb_4bit_quant_type: nf4
|
40 |
+
- bnb_4bit_use_double_quant: True
|
41 |
+
- bnb_4bit_compute_dtype: bfloat16
|
42 |
+
### Framework versions
|
43 |
+
|
44 |
+
- PEFT 0.4.0
|
45 |
+
- PEFT 0.4.0
|
46 |
+
|
47 |
+
- PEFT 0.4.0
|
checkpoint-750/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-750/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9608ed5e3c72ffc6c2eedea9d060f00bc1a8eab24a562138eebfe1a3d019390e
|
3 |
+
size 1742976394
|
checkpoint-825/adapter_model/README.md
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
### Framework versions
|
31 |
+
|
32 |
+
- PEFT 0.4.0
|
33 |
+
|
34 |
+
- PEFT 0.4.0
|
checkpoint-825/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-825/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:672734526e8a94b3144e2c08e92776f0b79ad0fa5f146e84f0354a0b2b07dda2
|
3 |
+
size 1742976394
|
checkpoint-900/adapter_model/README.md
ADDED
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
### Framework versions
|
31 |
+
|
32 |
+
- PEFT 0.4.0
|
33 |
+
|
34 |
+
- PEFT 0.4.0
|
35 |
+
The following `bitsandbytes` quantization config was used during training:
|
36 |
+
- quant_method: bitsandbytes
|
37 |
+
- load_in_8bit: False
|
38 |
+
- load_in_4bit: True
|
39 |
+
- llm_int8_threshold: 6.0
|
40 |
+
- llm_int8_skip_modules: None
|
41 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
42 |
+
- llm_int8_has_fp16_weight: False
|
43 |
+
- bnb_4bit_quant_type: nf4
|
44 |
+
- bnb_4bit_use_double_quant: True
|
45 |
+
- bnb_4bit_compute_dtype: bfloat16
|
46 |
+
### Framework versions
|
47 |
+
|
48 |
+
- PEFT 0.4.0
|
49 |
+
|
50 |
+
- PEFT 0.4.0
|
checkpoint-900/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|
checkpoint-900/adapter_model/adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c559b72b363f2977ba485cad04fcaee2b7505facb177e3b317fc94d78df86fca
|
3 |
+
size 1742976394
|
checkpoint-975/adapter_model/README.md
ADDED
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
---
|
4 |
+
## Training procedure
|
5 |
+
|
6 |
+
|
7 |
+
The following `bitsandbytes` quantization config was used during training:
|
8 |
+
- quant_method: bitsandbytes
|
9 |
+
- load_in_8bit: False
|
10 |
+
- load_in_4bit: True
|
11 |
+
- llm_int8_threshold: 6.0
|
12 |
+
- llm_int8_skip_modules: None
|
13 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
14 |
+
- llm_int8_has_fp16_weight: False
|
15 |
+
- bnb_4bit_quant_type: nf4
|
16 |
+
- bnb_4bit_use_double_quant: True
|
17 |
+
- bnb_4bit_compute_dtype: bfloat16
|
18 |
+
|
19 |
+
The following `bitsandbytes` quantization config was used during training:
|
20 |
+
- quant_method: bitsandbytes
|
21 |
+
- load_in_8bit: False
|
22 |
+
- load_in_4bit: True
|
23 |
+
- llm_int8_threshold: 6.0
|
24 |
+
- llm_int8_skip_modules: None
|
25 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
26 |
+
- llm_int8_has_fp16_weight: False
|
27 |
+
- bnb_4bit_quant_type: nf4
|
28 |
+
- bnb_4bit_use_double_quant: True
|
29 |
+
- bnb_4bit_compute_dtype: bfloat16
|
30 |
+
### Framework versions
|
31 |
+
|
32 |
+
- PEFT 0.4.0
|
33 |
+
|
34 |
+
- PEFT 0.4.0
|
35 |
+
The following `bitsandbytes` quantization config was used during training:
|
36 |
+
- quant_method: bitsandbytes
|
37 |
+
- load_in_8bit: False
|
38 |
+
- load_in_4bit: True
|
39 |
+
- llm_int8_threshold: 6.0
|
40 |
+
- llm_int8_skip_modules: None
|
41 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
42 |
+
- llm_int8_has_fp16_weight: False
|
43 |
+
- bnb_4bit_quant_type: nf4
|
44 |
+
- bnb_4bit_use_double_quant: True
|
45 |
+
- bnb_4bit_compute_dtype: bfloat16
|
46 |
+
### Framework versions
|
47 |
+
|
48 |
+
- PEFT 0.4.0
|
49 |
+
|
50 |
+
- PEFT 0.4.0
|
checkpoint-975/adapter_model/adapter_config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "/workspace/codellama-34b-hf",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 16.0,
|
11 |
+
"lora_dropout": 0.03,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 64,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"v_proj",
|
18 |
+
"up_proj",
|
19 |
+
"k_proj",
|
20 |
+
"down_proj",
|
21 |
+
"gate_proj",
|
22 |
+
"q_proj",
|
23 |
+
"o_proj"
|
24 |
+
],
|
25 |
+
"task_type": "CAUSAL_LM"
|
26 |
+
}
|