Commit: Update README.md

File changed: `README.md`

Diff hunk: `@@ -16,23 +16,35 @@` (section following "Base Model: *upstage/SOLAR-10.7B-v1.0*")
Before (README lines 16-38):

***hyper params I***

batch_size : 16
num_epochs : 1
micro_batch : 1
gradient_accumulation_steps : batch_size // micro_batch

***hyper params II***

cutoff_len : 4096
lr_scheduler : 'cosine'
warmup_ratio : 0.06
learning_rate : 4e-4
optimizer : 'adamw_torch'
weight_decay : 0.01
max_grad_norm : 1.0

***LoRA config***

lora_r : 64
lora_alpha : 16
lora_dropout : 0.05
lora_target_modules : ["gate_proj", "down_proj", "up_proj"]
After (README lines 16-50; the change inserts a blank line between each hyperparameter entry):

***hyper params I***

batch_size : 16

num_epochs : 1

micro_batch : 1

gradient_accumulation_steps : batch_size // micro_batch

***hyper params II***

cutoff_len : 4096

lr_scheduler : 'cosine'

warmup_ratio : 0.06

learning_rate : 4e-4

optimizer : 'adamw_torch'

weight_decay : 0.01

max_grad_norm : 1.0

***LoRA config***

lora_r : 64

lora_alpha : 16

lora_dropout : 0.05

lora_target_modules : ["gate_proj", "down_proj", "up_proj"]