ready to train
Browse files
- __pycache__/tasks.cpython-38.pyc +0 -0
- finetune_mt5_base.gin +0 -17
- norwegian_base.gin +3 -3
- pretrain_cont.gin +1 -0
- train_base.sh +2 -2
__pycache__/tasks.cpython-38.pyc
CHANGED
Binary files a/__pycache__/tasks.cpython-38.pyc and b/__pycache__/tasks.cpython-38.pyc differ
|
|
finetune_mt5_base.gin
DELETED
@@ -1,17 +0,0 @@
|
|
1 |
-
from __gin__ import dynamic_registration
|
2 |
-
|
3 |
-
include 't5x/examples/t5/mt5/base.gin'
|
4 |
-
include 't5x/configs/runs/finetune.gin'
|
5 |
-
|
6 |
-
# Register necessary SeqIO Tasks/Mixtures.
|
7 |
-
import t5.data.mixtures
|
8 |
-
|
9 |
-
import tasks
|
10 |
-
|
11 |
-
INITIAL_CHECKPOINT_PATH = "gs://t5-data/pretrained_models/t5x/mt5_base/checkpoint_1000000"
|
12 |
-
MIXTURE_OR_TASK_NAME = "ncc_small_span_corruption"
|
13 |
-
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
14 |
-
TRAIN_STEPS = 1100000
|
15 |
-
DROPOUT_RATE = 0.0
|
16 |
-
# BATCH_SIZE = 256
|
17 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
norwegian_base.gin
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
include 't5x/examples/t5/mt5/base.gin'
|
2 |
-
|
3 |
#include 't5x/configs/runs/pretrain.gin'
|
4 |
-
|
5 |
|
6 |
|
7 |
# Register necessary SeqIO Tasks/Mixtures.
|
@@ -12,6 +12,6 @@ MIXTURE_OR_TASK_NAME = "ncc_span_corruption_stream"
|
|
12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
13 |
TRAIN_STEPS = 1_100_000
|
14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
15 |
-
INITIAL_CHECKPOINT_PATH = "gs://t5-data/pretrained_models/t5x/
|
16 |
#PjitPartitioner.num_partitions = 2
|
17 |
|
|
|
1 |
include 't5x/examples/t5/mt5/base.gin'
|
2 |
+
include 'pretrain_cont.gin'
|
3 |
#include 't5x/configs/runs/pretrain.gin'
|
4 |
+
#include 't5x/configs/runs/finetune.gin'
|
5 |
|
6 |
|
7 |
# Register necessary SeqIO Tasks/Mixtures.
|
|
|
12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
13 |
TRAIN_STEPS = 1_100_000
|
14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
15 |
+
INITIAL_CHECKPOINT_PATH = "gs://t5-data/pretrained_models/t5x/mt5_base/checkpoint_1000000"
|
16 |
#PjitPartitioner.num_partitions = 2
|
17 |
|
pretrain_cont.gin
CHANGED
@@ -93,6 +93,7 @@ utils.CheckpointConfig:
|
|
93 |
save = @utils.SaveCheckpointConfig()
|
94 |
utils.RestoreCheckpointConfig:
|
95 |
path = %INITIAL_CHECKPOINT_PATH
|
|
|
96 |
dtype = 'float32'
|
97 |
utils.SaveCheckpointConfig:
|
98 |
period = 1000
|
|
|
93 |
save = @utils.SaveCheckpointConfig()
|
94 |
utils.RestoreCheckpointConfig:
|
95 |
path = %INITIAL_CHECKPOINT_PATH
|
96 |
+
mode = 'specific'
|
97 |
dtype = 'float32'
|
98 |
utils.SaveCheckpointConfig:
|
99 |
period = 1000
|
train_base.sh
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
PROJECT_DIR=${HOME}"/models/pk-nb-t5x"
|
2 |
T5X_DIR="../../t5x" # directory where the t5x is cloned.
|
3 |
-
MODEL_DIR="gs://nb-t5x-us-central2/
|
4 |
export PYTHONPATH=${PROJECT_DIR}
|
5 |
|
6 |
python3 ${T5X_DIR}/t5x/train.py \
|
7 |
--gin_search_paths=${PROJECT_DIR} \
|
8 |
-
--gin_file="
|
9 |
--gin.MODEL_DIR="'${MODEL_DIR}'" \
|
|
|
1 |
PROJECT_DIR=${HOME}"/models/pk-nb-t5x"
|
2 |
T5X_DIR="../../t5x" # directory where the t5x is cloned.
|
3 |
+
MODEL_DIR="gs://nb-t5x-us-central2/pk_nb_t5x_base_run1"
|
4 |
export PYTHONPATH=${PROJECT_DIR}
|
5 |
|
6 |
python3 ${T5X_DIR}/t5x/train.py \
|
7 |
--gin_search_paths=${PROJECT_DIR} \
|
8 |
+
--gin_file="norwegian_base.gin" \
|
9 |
--gin.MODEL_DIR="'${MODEL_DIR}'" \
|