elijah0430 committed on
Commit
d50c128
·
1 Parent(s): 600ec85

Upload model

Browse files
Files changed (3) hide show
  1. README.md +4 -5
  2. adapter_config.json +3 -0
  3. adapter_model.safetensors +1 -1
README.md CHANGED
@@ -18,6 +18,7 @@ base_model: beomi/polyglot-ko-12.8b-safetensors
18
 
19
 
20
  - **Developed by:** [More Information Needed]
 
21
  - **Shared by [optional]:** [More Information Needed]
22
  - **Model type:** [More Information Needed]
23
  - **Language(s) (NLP):** [More Information Needed]
@@ -76,7 +77,7 @@ Use the code below to get started with the model.
76
 
77
  ### Training Data
78
 
79
- <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
80
 
81
  [More Information Needed]
82
 
@@ -107,7 +108,7 @@ Use the code below to get started with the model.
107
 
108
  #### Testing Data
109
 
110
- <!-- This should link to a Data Card if possible. -->
111
 
112
  [More Information Needed]
113
 
@@ -200,7 +201,6 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
200
 
201
  ## Training procedure
202
 
203
-
204
  The following `bitsandbytes` quantization config was used during training:
205
  - quant_method: bitsandbytes
206
  - load_in_8bit: False
@@ -215,5 +215,4 @@ The following `bitsandbytes` quantization config was used during training:
215
 
216
  ### Framework versions
217
 
218
-
219
- - PEFT 0.6.2.dev0
 
18
 
19
 
20
  - **Developed by:** [More Information Needed]
21
+ - **Funded by [optional]:** [More Information Needed]
22
  - **Shared by [optional]:** [More Information Needed]
23
  - **Model type:** [More Information Needed]
24
  - **Language(s) (NLP):** [More Information Needed]
 
77
 
78
  ### Training Data
79
 
80
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
81
 
82
  [More Information Needed]
83
 
 
108
 
109
  #### Testing Data
110
 
111
+ <!-- This should link to a Dataset Card if possible. -->
112
 
113
  [More Information Needed]
114
 
 
201
 
202
  ## Training procedure
203
 
 
204
  The following `bitsandbytes` quantization config was used during training:
205
  - quant_method: bitsandbytes
206
  - load_in_8bit: False
 
215
 
216
  ### Framework versions
217
 
218
+ - PEFT 0.6.3.dev0
 
adapter_config.json CHANGED
@@ -8,8 +8,11 @@
8
  "init_lora_weights": true,
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
 
11
  "lora_alpha": 32,
12
  "lora_dropout": 0.05,
 
 
13
  "modules_to_save": null,
14
  "peft_type": "LORA",
15
  "r": 8,
 
8
  "init_lora_weights": true,
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
11
+ "loftq_config": {},
12
  "lora_alpha": 32,
13
  "lora_dropout": 0.05,
14
+ "megatron_config": null,
15
+ "megatron_core": "megatron.core",
16
  "modules_to_save": null,
17
  "peft_type": "LORA",
18
  "r": 8,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8652068b48cb207dac8788fc697c5a7e1b1b0b2dda5115f0d8f4dc9109ac5069
3
  size 26226072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee020b79a72e6fa134c3c14fb51c91727aadeaae7d144a765f067fc9eee2efe7
3
  size 26226072