Kevin Fink committed on
Commit
688891e
·
1 Parent(s): 440639a
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -55,7 +55,7 @@ def fine_tune_model(model, dataset_name, hub_id, api_key, num_epochs, batch_size
55
 
56
  # Set training arguments
57
  training_args = TrainingArguments(
58
- torch_empty_cache_steps=1000,
59
  overwrite_output_dir=True,
60
  output_dir='/data/results',
61
  eval_strategy="steps", # Change this to steps
@@ -71,12 +71,12 @@ def fine_tune_model(model, dataset_name, hub_id, api_key, num_epochs, batch_size
71
  metric_for_best_model="accuracy",
72
  greater_is_better=True,
73
  logging_dir='/data/logs',
74
- logging_steps=2000,
75
  #push_to_hub=True,
76
  hub_model_id=hub_id.strip(),
77
  fp16=True,
78
  #lr_scheduler_type='cosine',
79
- save_steps=2000, # Save checkpoint every 500 steps
80
  save_total_limit=3,
81
  )
82
  # Check if a checkpoint exists and load it
 
55
 
56
  # Set training arguments
57
  training_args = TrainingArguments(
58
+ torch_empty_cache_steps=100,
59
  overwrite_output_dir=True,
60
  output_dir='/data/results',
61
  eval_strategy="steps", # Change this to steps
 
71
  metric_for_best_model="accuracy",
72
  greater_is_better=True,
73
  logging_dir='/data/logs',
74
+ logging_steps=300,
75
  #push_to_hub=True,
76
  hub_model_id=hub_id.strip(),
77
  fp16=True,
78
  #lr_scheduler_type='cosine',
79
+ save_steps=300, # Save checkpoint every 500 steps
80
  save_total_limit=3,
81
  )
82
  # Check if a checkpoint exists and load it