Kevin Fink
committed on
Commit
·
688891e
1
Parent(s):
440639a
dev
Browse files
app.py
CHANGED
@@ -55,7 +55,7 @@ def fine_tune_model(model, dataset_name, hub_id, api_key, num_epochs, batch_size
|
|
55 |
|
56 |
# Set training arguments
|
57 |
training_args = TrainingArguments(
|
58 |
-
torch_empty_cache_steps=
|
59 |
overwrite_output_dir=True,
|
60 |
output_dir='/data/results',
|
61 |
eval_strategy="steps", # Change this to steps
|
@@ -71,12 +71,12 @@ def fine_tune_model(model, dataset_name, hub_id, api_key, num_epochs, batch_size
|
|
71 |
metric_for_best_model="accuracy",
|
72 |
greater_is_better=True,
|
73 |
logging_dir='/data/logs',
|
74 |
-
logging_steps=
|
75 |
#push_to_hub=True,
|
76 |
hub_model_id=hub_id.strip(),
|
77 |
fp16=True,
|
78 |
#lr_scheduler_type='cosine',
|
79 |
-
save_steps=
|
80 |
save_total_limit=3,
|
81 |
)
|
82 |
# Check if a checkpoint exists and load it
|
|
|
55 |
|
56 |
# Set training arguments
|
57 |
training_args = TrainingArguments(
|
58 |
+
torch_empty_cache_steps=100,
|
59 |
overwrite_output_dir=True,
|
60 |
output_dir='/data/results',
|
61 |
eval_strategy="steps", # Change this to steps
|
|
|
71 |
metric_for_best_model="accuracy",
|
72 |
greater_is_better=True,
|
73 |
logging_dir='/data/logs',
|
74 |
+
logging_steps=300,
|
75 |
#push_to_hub=True,
|
76 |
hub_model_id=hub_id.strip(),
|
77 |
fp16=True,
|
78 |
#lr_scheduler_type='cosine',
|
79 |
+
save_steps=300, # Save checkpoint every 300 steps
|
80 |
save_total_limit=3,
|
81 |
)
|
82 |
# Check if a checkpoint exists and load it
|