Update README.md
Browse files
README.md
CHANGED
@@ -21,7 +21,7 @@ export WANDB_PROJECT=airoboros-mpt-30b-gpt4-1.4
|
|
21 |
python qlora.py \
|
22 |
--model_name_or_path ./mpt-30b \
|
23 |
--output_dir ./$WANDB_PROJECT-checkpoints \
|
24 |
-
--num_train_epochs
|
25 |
--logging_steps 1 \
|
26 |
--save_strategy steps \
|
27 |
--data_seed 11422 \
|
@@ -48,7 +48,7 @@ python qlora.py \
|
|
48 |
--model_max_len 8192 \
|
49 |
--gradient_checkpointing \
|
50 |
--per_device_train_batch_size 6 \
|
51 |
-
--gradient_accumulation_steps
|
52 |
--learning_rate 0.0001 \
|
53 |
--adam_beta2 0.999 \
|
54 |
--max_grad_norm 0.3 \
|
|
|
21 |
python qlora.py \
|
22 |
--model_name_or_path ./mpt-30b \
|
23 |
--output_dir ./$WANDB_PROJECT-checkpoints \
|
24 |
+
--num_train_epochs 3 \
|
25 |
--logging_steps 1 \
|
26 |
--save_strategy steps \
|
27 |
--data_seed 11422 \
|
|
|
48 |
--model_max_len 8192 \
|
49 |
--gradient_checkpointing \
|
50 |
--per_device_train_batch_size 6 \
|
51 |
+
--gradient_accumulation_steps 1 \
|
52 |
--learning_rate 0.0001 \
|
53 |
--adam_beta2 0.999 \
|
54 |
--max_grad_norm 0.3 \
|