Kevin Fink committed on
Commit
0ad10bb
·
1 Parent(s): d52c194
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -217,8 +217,8 @@ def fine_tune_model(model, dataset_name, hub_id, api_key, num_epochs, batch_size
217
  dataset = load_dataset(dataset_name.strip())
218
 
219
  #dataset['train'] = dataset['train'].select(range(8000))
220
- dataset['train'] = dataset['train'].select(range(4000))
221
- dataset['validation'] = dataset['validation'].select(range(200))
222
  train_set = dataset.map(tokenize_function, batched=True)
223
  #valid_set = dataset['validation'].map(tokenize_function, batched=True)
224
 
@@ -235,7 +235,7 @@ def fine_tune_model(model, dataset_name, hub_id, api_key, num_epochs, batch_size
235
  eval_dataset=train_set['validation'],
236
  compute_metrics=compute_metrics,
237
  #data_collator=data_collator,
238
- processing_class=tokenizer,
239
  )
240
 
241
  # Fine-tune the model
 
217
  dataset = load_dataset(dataset_name.strip())
218
 
219
  #dataset['train'] = dataset['train'].select(range(8000))
220
+ dataset['train'] = dataset['train'].select(range(1000))
221
+ dataset['validation'] = dataset['validation'].select(range(100))
222
  train_set = dataset.map(tokenize_function, batched=True)
223
  #valid_set = dataset['validation'].map(tokenize_function, batched=True)
224
 
 
235
  eval_dataset=train_set['validation'],
236
  compute_metrics=compute_metrics,
237
  #data_collator=data_collator,
238
+ #processing_class=tokenizer,
239
  )
240
 
241
  # Fine-tune the model