jondurbin committed on
Commit
3f09a99
·
1 Parent(s): 7870f62

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +2 -2
README.md CHANGED
@@ -21,7 +21,7 @@ export WANDB_PROJECT=airoboros-mpt-30b-gpt4-1.4
21
  python qlora.py \
22
  --model_name_or_path ./mpt-30b \
23
  --output_dir ./$WANDB_PROJECT-checkpoints \
24
- --num_train_epochs 4 \
25
  --logging_steps 1 \
26
  --save_strategy steps \
27
  --data_seed 11422 \
@@ -48,7 +48,7 @@ python qlora.py \
48
  --model_max_len 8192 \
49
  --gradient_checkpointing \
50
  --per_device_train_batch_size 6 \
51
- --gradient_accumulation_steps 16 \
52
  --learning_rate 0.0001 \
53
  --adam_beta2 0.999 \
54
  --max_grad_norm 0.3 \
 
21
  python qlora.py \
22
  --model_name_or_path ./mpt-30b \
23
  --output_dir ./$WANDB_PROJECT-checkpoints \
24
+ --num_train_epochs 3 \
25
  --logging_steps 1 \
26
  --save_strategy steps \
27
  --data_seed 11422 \
 
48
  --model_max_len 8192 \
49
  --gradient_checkpointing \
50
  --per_device_train_batch_size 6 \
51
+ --gradient_accumulation_steps 1 \
52
  --learning_rate 0.0001 \
53
  --adam_beta2 0.999 \
54
  --max_grad_norm 0.3 \