pere committed on
Commit
d29dd3e
1 Parent(s): cac60d2

ready to train

Browse files
__pycache__/tasks.cpython-38.pyc CHANGED
Binary files a/__pycache__/tasks.cpython-38.pyc and b/__pycache__/tasks.cpython-38.pyc differ
 
finetune_mt5_base.gin DELETED
@@ -1,17 +0,0 @@
1
- from __gin__ import dynamic_registration
2
-
3
- include 't5x/examples/t5/mt5/base.gin'
4
- include 't5x/configs/runs/finetune.gin'
5
-
6
- # Register necessary SeqIO Tasks/Mixtures.
7
- import t5.data.mixtures
8
-
9
- import tasks
10
-
11
- INITIAL_CHECKPOINT_PATH = "gs://t5-data/pretrained_models/t5x/mt5_base/checkpoint_1000000"
12
- MIXTURE_OR_TASK_NAME = "ncc_small_span_corruption"
13
- TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
14
- TRAIN_STEPS = 1100000
15
- DROPOUT_RATE = 0.0
16
- # BATCH_SIZE = 256
17
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
norwegian_base.gin CHANGED
@@ -1,7 +1,7 @@
1
  include 't5x/examples/t5/mt5/base.gin'
2
- #include 'pretrain_cont.gin'
3
  #include 't5x/configs/runs/pretrain.gin'
4
- include 't5x/configs/runs/finetune.gin'
5
 
6
 
7
  # Register necessary SeqIO Tasks/Mixtures.
@@ -12,6 +12,6 @@ MIXTURE_OR_TASK_NAME = "ncc_span_corruption_stream"
12
  TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
13
  TRAIN_STEPS = 1_100_000
14
  DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
15
- INITIAL_CHECKPOINT_PATH = "gs://t5-data/pretrained_models/t5x/mt5_xxl/checkpoint_1000000"
16
  #PjitPartitioner.num_partitions = 2
17
 
 
1
  include 't5x/examples/t5/mt5/base.gin'
2
+ include 'pretrain_cont.gin'
3
  #include 't5x/configs/runs/pretrain.gin'
4
+ #include 't5x/configs/runs/finetune.gin'
5
 
6
 
7
  # Register necessary SeqIO Tasks/Mixtures.
 
12
  TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
13
  TRAIN_STEPS = 1_100_000
14
  DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
15
+ INITIAL_CHECKPOINT_PATH = "gs://t5-data/pretrained_models/t5x/mt5_base/checkpoint_1000000"
16
  #PjitPartitioner.num_partitions = 2
17
 
pretrain_cont.gin CHANGED
@@ -93,6 +93,7 @@ utils.CheckpointConfig:
93
  save = @utils.SaveCheckpointConfig()
94
  utils.RestoreCheckpointConfig:
95
  path = %INITIAL_CHECKPOINT_PATH
 
96
  dtype = 'float32'
97
  utils.SaveCheckpointConfig:
98
  period = 1000
 
93
  save = @utils.SaveCheckpointConfig()
94
  utils.RestoreCheckpointConfig:
95
  path = %INITIAL_CHECKPOINT_PATH
96
+ mode = 'specific'
97
  dtype = 'float32'
98
  utils.SaveCheckpointConfig:
99
  period = 1000
train_base.sh CHANGED
@@ -1,9 +1,9 @@
1
  PROJECT_DIR=${HOME}"/models/pk-nb-t5x"
2
  T5X_DIR="../../t5x" # directory where the t5x is cloned.
3
- MODEL_DIR="gs://nb-t5x-us-central2/pk_nb_t5x_base_test2"
4
  export PYTHONPATH=${PROJECT_DIR}
5
 
6
  python3 ${T5X_DIR}/t5x/train.py \
7
  --gin_search_paths=${PROJECT_DIR} \
8
- --gin_file="finetune_mt5_base.gin" \
9
  --gin.MODEL_DIR="'${MODEL_DIR}'" \
 
1
  PROJECT_DIR=${HOME}"/models/pk-nb-t5x"
2
  T5X_DIR="../../t5x" # directory where the t5x is cloned.
3
+ MODEL_DIR="gs://nb-t5x-us-central2/pk_nb_t5x_base_run1"
4
  export PYTHONPATH=${PROJECT_DIR}
5
 
6
  python3 ${T5X_DIR}/t5x/train.py \
7
  --gin_search_paths=${PROJECT_DIR} \
8
+ --gin_file="norwegian_base.gin" \
9
  --gin.MODEL_DIR="'${MODEL_DIR}'" \