summary all
Browse files
- __pycache__/my_metrics.cpython-38.pyc +0 -0
- summary_all_scandflan_base.sh +14 -0
- tasks.py +16 -0
__pycache__/my_metrics.cpython-38.pyc
DELETED
Binary file (446 Bytes)
|
|
summary_all_scandflan_base.sh
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Launch a T5X training run for the "summary_all_scand" task, starting from
# an existing checkpoint. The train.py path and the gin search path are
# relative, so the script depends on the directory it is started from.

# PYTHONPATH is set to the project directory (it replaces any existing value).
PROJECT_DIR="${HOME}/models/t5-summary"
export PYTHONPATH="${PROJECT_DIR}"

# The backslash-escaped double quotes are part of the value on purpose: the
# string is handed to a --gin.* override, which expects a quoted string
# literal (same convention as the MODEL_DIR and MIXTURE_OR_TASK_NAME flags).
INITIAL_CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/exp5-t5-base-ul2-scandvoc-full/checkpoint_1500000\"

# 50,000 above the step number in the checkpoint path; presumably the
# fine-tuning budget on top of the restored step count -- TODO confirm.
TRAIN_STEPS=1550000



# The last argument deliberately has no trailing backslash: a dangling
# continuation would absorb whatever line is appended after it.
python3 ../../t5x/t5x/train.py \
    --gin_search_paths="./" \
    --gin.TRAIN_STEPS="${TRAIN_STEPS}" \
    --gin_file="finetune_summary_scandflan_base.gin" \
    --gin.MIXTURE_OR_TASK_NAME=\"summary_all_scand\" \
    --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/summary_scandflan_all_base\" \
    --gin.INITIAL_CHECKPOINT_PATH="${INITIAL_CHECKPOINT_PATH}"
|
tasks.py
CHANGED
@@ -247,4 +247,20 @@ seqio.TaskRegistry.add(
|
|
247 |
metric_fns=[metrics.accuracy,my_metrics.f1_macro,metrics.bleu,metrics.rouge],
|
248 |
output_features=MT5_OUTPUT_FEATURES,
|
249 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
250 |
|
|
|
247 |
metric_fns=[metrics.accuracy,my_metrics.f1_macro,metrics.bleu,metrics.rouge],
|
248 |
output_features=MT5_OUTPUT_FEATURES,
|
249 |
)
|
250 |
+
# Register the "summary_all_scand" task: text lines are read from the files
# in tsv_summary_all_path, split into "source"/"target" fields, passed
# through categorise_preprocessor, then tokenized with EOS appended.
seqio.TaskRegistry.add(
    "summary_all_scand",
    # num_input_examples is not passed (the original had it commented out).
    source=seqio.TextLineDataSource(split_to_filepattern=tsv_summary_all_path),
    output_features=SCAND_OUTPUT_FEATURES,
    preprocessors=[
        functools.partial(
            t5.data.preprocessors.parse_tsv,
            field_names=["source", "target"],
        ),
        categorise_preprocessor,
        seqio.preprocessors.tokenize_and_append_eos,
    ],
    metric_fns=[
        metrics.accuracy,
        my_metrics.f1_macro,
        metrics.bleu,
        metrics.rouge,
    ],
)
|
266 |
|