Kevin Fink committed on
Commit
d43fb9e
·
1 Parent(s): d0bc2c3
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -190,7 +190,7 @@ def fine_tune_model(model, dataset_name, hub_id, api_key, num_epochs, batch_size
190
  dataset['train'] = second_third
191
  del dataset['test']
192
  tokenized_sh_fq_dataset = dataset.map(tokenize_function, batched=True,)
193
- dataset['validation'] = tokenize_function(dataset['validation'])
194
  saved_dataset = load_from_disk(f'/data/{hub_id.strip()}_train_dataset')
195
  dataset['train'] = concatenate_datasets([saved_dataset, tokenized_sh_fq_dataset['train']])
196
  dataset['train'].save_to_disk(f'/data/{hub_id.strip()}_train_dataset2')
 
190
  dataset['train'] = second_third
191
  del dataset['test']
192
  tokenized_sh_fq_dataset = dataset.map(tokenize_function, batched=True,)
193
+ dataset['validation'] = dataset['validation'].map(tokenize_function, batched=True)
194
  saved_dataset = load_from_disk(f'/data/{hub_id.strip()}_train_dataset')
195
  dataset['train'] = concatenate_datasets([saved_dataset, tokenized_sh_fq_dataset['train']])
196
  dataset['train'].save_to_disk(f'/data/{hub_id.strip()}_train_dataset2')