Kevin Fink
committed on
Commit
·
0ad10bb
1
Parent(s):
d52c194
deve
Browse files
app.py
CHANGED
@@ -217,8 +217,8 @@ def fine_tune_model(model, dataset_name, hub_id, api_key, num_epochs, batch_size
|
|
217 |
dataset = load_dataset(dataset_name.strip())
|
218 |
|
219 |
#dataset['train'] = dataset['train'].select(range(8000))
|
220 |
-
dataset['train'] = dataset['train'].select(range(
|
221 |
-
dataset['validation'] = dataset['validation'].select(range(
|
222 |
train_set = dataset.map(tokenize_function, batched=True)
|
223 |
#valid_set = dataset['validation'].map(tokenize_function, batched=True)
|
224 |
|
@@ -235,7 +235,7 @@ def fine_tune_model(model, dataset_name, hub_id, api_key, num_epochs, batch_size
|
|
235 |
eval_dataset=train_set['validation'],
|
236 |
compute_metrics=compute_metrics,
|
237 |
#data_collator=data_collator,
|
238 |
-
processing_class=tokenizer,
|
239 |
)
|
240 |
|
241 |
# Fine-tune the model
|
|
|
217 |
dataset = load_dataset(dataset_name.strip())
|
218 |
|
219 |
#dataset['train'] = dataset['train'].select(range(8000))
|
220 |
+
dataset['train'] = dataset['train'].select(range(1000))
|
221 |
+
dataset['validation'] = dataset['validation'].select(range(100))
|
222 |
train_set = dataset.map(tokenize_function, batched=True)
|
223 |
#valid_set = dataset['validation'].map(tokenize_function, batched=True)
|
224 |
|
|
|
235 |
eval_dataset=train_set['validation'],
|
236 |
compute_metrics=compute_metrics,
|
237 |
#data_collator=data_collator,
|
238 |
+
#processing_class=tokenizer,
|
239 |
)
|
240 |
|
241 |
# Fine-tune the model
|