pere committed on
Commit
e5e15cf
1 Parent(s): 91f0b3d

summary all

Browse files
__pycache__/my_metrics.cpython-38.pyc DELETED
Binary file (446 Bytes)
 
summary_all_scandflan_base.sh ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ PROJECT_DIR=${HOME}"/models/t5-summary"
2
+ export PYTHONPATH=${PROJECT_DIR}
3
+ INITIAL_CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/exp5-t5-base-ul2-scandvoc-full/checkpoint_1500000\"
4
+ TRAIN_STEPS=1550000
5
+
6
+
7
+
8
+ python3 ../../t5x/t5x/train.py \
9
+ --gin_search_paths="./" \
10
+ --gin.TRAIN_STEPS=${TRAIN_STEPS} \
11
+ --gin_file="finetune_summary_scandflan_base.gin" \
12
+ --gin.MIXTURE_OR_TASK_NAME=\"summary_all_scand\" \
13
+ --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/summary_scandflan_all_base\" \
14
+ --gin.INITIAL_CHECKPOINT_PATH=${INITIAL_CHECKPOINT_PATH} \
tasks.py CHANGED
@@ -247,4 +247,20 @@ seqio.TaskRegistry.add(
247
  metric_fns=[metrics.accuracy,my_metrics.f1_macro,metrics.bleu,metrics.rouge],
248
  output_features=MT5_OUTPUT_FEATURES,
249
  )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
250
 
 
247
  metric_fns=[metrics.accuracy,my_metrics.f1_macro,metrics.bleu,metrics.rouge],
248
  output_features=MT5_OUTPUT_FEATURES,
249
  )
250
+ seqio.TaskRegistry.add(
251
+ "summary_all_scand",
252
+ source=seqio.TextLineDataSource(
253
+ split_to_filepattern=tsv_summary_all_path,
254
+ #num_input_examples=num_nq_examples
255
+ ),
256
+ preprocessors=[
257
+ functools.partial(
258
+ t5.data.preprocessors.parse_tsv,
259
+ field_names=["source","target"]),
260
+ categorise_preprocessor,
261
+ seqio.preprocessors.tokenize_and_append_eos,
262
+ ],
263
+ metric_fns=[metrics.accuracy,my_metrics.f1_macro,metrics.bleu,metrics.rouge],
264
+ output_features=SCAND_OUTPUT_FEATURES,
265
+ )
266