pere committed on
Commit
3cb2c20
1 Parent(s): 3ea67f4
parallel_train.jsonl → parallel_train.json RENAMED
File without changes
run_translation_t5_flax.py CHANGED
@@ -215,17 +215,7 @@ class DataTrainingArguments:
215
 
216
 
217
  summarization_name_mapping = {
218
- "amazon_reviews_multi": ("review_body", "review_title"),
219
- "big_patent": ("description", "abstract"),
220
- "cnn_dailymail": ("article", "highlights"),
221
- "orange_sum": ("text", "summary"),
222
- "pn_summary": ("article", "summary"),
223
- "psc": ("extract_text", "summary_text"),
224
- "samsum": ("dialogue", "summary"),
225
- "thaisum": ("body", "summary"),
226
- "xglue": ("news_body", "news_title"),
227
- "xsum": ("document", "summary"),
228
- "wiki_summary": ("article", "highlights"),
229
  }
230
 
231
 
@@ -407,7 +397,7 @@ def main():
407
  return
408
 
409
  # Get the column names for input/target.
410
- dataset_columns = summarization_name_mapping.get(data_args.dataset_name, None)
411
  if data_args.text_column is None:
412
  text_column = dataset_columns[0] if dataset_columns is not None else column_names[0]
413
  else:
 
215
 
216
 
217
  summarization_name_mapping = {
218
+ "translation": ("nb", "nn"),
 
 
 
 
 
 
 
 
 
 
219
  }
220
 
221
 
 
397
  return
398
 
399
  # Get the column names for input/target.
400
+ dataset_columns = summarization_name_mapping.get("translation", None)
401
  if data_args.text_column is None:
402
  text_column = dataset_columns[0] if dataset_columns is not None else column_names[0]
403
  else: