Kevin Fink
committed on
Commit
·
d43fb9e
1
Parent(s):
d0bc2c3
deve
Browse files
app.py
CHANGED
@@ -190,7 +190,7 @@ def fine_tune_model(model, dataset_name, hub_id, api_key, num_epochs, batch_size
|
|
190 |
dataset['train'] = second_third
|
191 |
del dataset['test']
|
192 |
tokenized_sh_fq_dataset = dataset.map(tokenize_function, batched=True,)
|
193 |
-
dataset['validation'] =
|
194 |
saved_dataset = load_from_disk(f'/data/{hub_id.strip()}_train_dataset')
|
195 |
dataset['train'] = concatenate_datasets([saved_dataset, tokenized_sh_fq_dataset['train']])
|
196 |
dataset['train'].save_to_disk(f'/data/{hub_id.strip()}_train_dataset2')
|
|
|
190 |
dataset['train'] = second_third
|
191 |
del dataset['test']
|
192 |
tokenized_sh_fq_dataset = dataset.map(tokenize_function, batched=True,)
|
193 |
+
dataset['validation'] = dataset['validation'].map(tokenize_function, batched=True)
|
194 |
saved_dataset = load_from_disk(f'/data/{hub_id.strip()}_train_dataset')
|
195 |
dataset['train'] = concatenate_datasets([saved_dataset, tokenized_sh_fq_dataset['train']])
|
196 |
dataset['train'].save_to_disk(f'/data/{hub_id.strip()}_train_dataset2')
|