jd3 / params.json
stojchet's picture
Upload params.json with huggingface_hub
0b77c85 verified
raw
history blame contribute delete
369 Bytes
{"base_model": "deepseek-ai/deepseek-coder-1.3b-base", "dataset_name": "stojchet/dpo-final_base_dataset", "dataset_size": 7500, "epochs": 5, "gradient_accumulation_steps": 64, "language": "java", "learning_rate": 1e-06, "lora_alpha": 16, "lora_dropout": 0.1, "lora_r": 64, "max_seq_length": 1000, "no_lora": true, "per_device_train_batch_size": 16, "weight_decay": 0.1}