pere committed on
Commit
57a778a
1 Parent(s): 556e14e

batch scripts

Browse files
batch_sentiment_base.sh CHANGED
@@ -1,21 +1,22 @@
1
  PROJECT_DIR=${HOME}"/models/t5-parliament-categorisation"
2
  export PYTHONPATH=${PROJECT_DIR}
3
 
4
- python3 ../../t5x/t5x/train.py --gin_search_paths="./" --gin_file="finetune_categorisation_base.gin" --gin.MIXTURE_OR_TASK_NAME=\"sentiment\" --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/v1_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment\" &&
5
- python3 ../../t5x/t5x/train.py --gin_search_paths="./" --gin_file="finetune_categorisation_base.gin" --gin.MIXTURE_OR_TASK_NAME=\"sentiment\" --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/v2_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment\" &&
6
- python3 ../../t5x/t5x/train.py --gin_search_paths="./" --gin_file="finetune_categorisation_base.gin" --gin.MIXTURE_OR_TASK_NAME=\"sentiment\" --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/v3_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment\" &&
7
- python3 ../../t5x/t5x/train.py --gin_search_paths="./" --gin_file="finetune_categorisation_base.gin" --gin.MIXTURE_OR_TASK_NAME=\"sentiment\" --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/v4_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment\" &&
8
- python3 ../../t5x/t5x/train.py --gin_search_paths="./" --gin_file="finetune_categorisation_base.gin" --gin.MIXTURE_OR_TASK_NAME=\"sentiment\" --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/v5_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment\" &&
9
- python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"validation\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/v1_finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\" &&
10
- python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"validation\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/v2_finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\" &&
11
- python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"validation\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/v3_finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\" &&
12
- python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"validation\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/v4_finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\" &&
13
- python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"validation\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/v5_finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\" &&
14
- python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"test\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/v1_finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\" &&
15
- python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"test\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/v2_finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\" &&
16
- python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"test\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/v3_finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\" &&
17
- python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"test\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/v4_finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\" &&
18
- python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"test\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/v5_finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\" &&
 
19
 
20
 
21
 
 
1
  PROJECT_DIR=${HOME}"/models/t5-parliament-categorisation"
2
  export PYTHONPATH=${PROJECT_DIR}
3
 
4
+ #python3 ../../t5x/t5x/train.py --gin_search_paths="./" --gin_file="finetune_categorisation_base.gin" --gin.MIXTURE_OR_TASK_NAME=\"sentiment\" --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/v1_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment\"
5
+ python3 ../../t5x/t5x/train.py --gin_search_paths="./" --gin_file="finetune_categorisation_base.gin" --gin.MIXTURE_OR_TASK_NAME=\"sentiment\" --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/v2_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment\"
6
+ #python3 ../../t5x/t5x/train.py --gin_search_paths="./" --gin_file="finetune_categorisation_base.gin" --gin.MIXTURE_OR_TASK_NAME=\"sentiment\" --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/v3_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment\"
7
+ #python3 ../../t5x/t5x/train.py --gin_search_paths="./" --gin_file="finetune_categorisation_base.gin" --gin.MIXTURE_OR_TASK_NAME=\"sentiment\" --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/v4_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment\"
8
+ #python3 ../../t5x/t5x/train.py --gin_search_paths="./" --gin_file="finetune_categorisation_base.gin" --gin.MIXTURE_OR_TASK_NAME=\"sentiment\" --gin.MODEL_DIR=\"gs://nb-t5x-us-central2/finetuned/v5_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment\"
9
+ #python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"validation\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/finetuned/v1_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\"
10
+ python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"validation\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/finetuned/v2_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\"
11
+ #python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"validation\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/finetuned/v3_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\"
12
+ #python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"validation\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/finetuned/v4_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\"
13
+ #python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"validation\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/finetuned/v5_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\"
14
+ #python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"test\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/finetuned/v1_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\"
15
+ python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"test\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/finetuned/v2_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\"
16
+ #python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"test\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/finetuned/v3_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\"
17
+ #python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"test\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/finetuned/v4_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\"
18
+ #python3 eval.py --gin_search_paths="./" --gin_file="eval_categorisation_base.gin" --gin.SPLIT=\"test\" --gin.CHECKPOINT_PATH=\"gs://nb-t5x-us-central2/finetuned/v5_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000\"
19
+
20
 
21
 
22
 
eval_categorisation_base.gin CHANGED
@@ -12,7 +12,7 @@ CHECKPOINT_PATH = %gin.REQUIRED # passed via commandline
12
  SPLIT = %gin.REQUIRED # passed via commandline
13
  EVAL_OUTPUT_DIR = "./log/"
14
  DROPOUT_RATE = 0.0 # unused boilerplate
15
- MIXTURE_OR_TASK_NAME = "parliament"
16
 
17
  eval_script.evaluate:
18
  model = %MODEL # imported from separate gin file
 
12
  SPLIT = %gin.REQUIRED # passed via commandline
13
  EVAL_OUTPUT_DIR = "./log/"
14
  DROPOUT_RATE = 0.0 # unused boilerplate
15
+ MIXTURE_OR_TASK_NAME = "sentiment"
16
 
17
  eval_script.evaluate:
18
  model = %MODEL # imported from separate gin file
log/config.gin CHANGED
@@ -12,15 +12,15 @@ import tasks
12
  # Macros:
13
  # ==============================================================================
14
  CHECKPOINT_PATH = \
15
- 'gs://nb-t5x-us-central2/finetuned/norwegian_NCC_plus_English_t5x_base_1_500_000_parliament/checkpoint_1510000'
16
  DROPOUT_RATE = 0.0
17
  EVAL_OUTPUT_DIR = './log/'
18
  LABEL_SMOOTHING = 0.0
19
  LOSS_NORMALIZING_FACTOR = None
20
- MIXTURE_OR_TASK_NAME = 'parliament'
21
  MODEL = @models.EncoderDecoderModel()
22
  OPTIMIZER = @adafactor.Adafactor()
23
- SPLIT = 'validation'
24
  VOCABULARY = @seqio.SentencePieceVocabulary()
25
  Z_LOSS = 0.0001
26
 
 
12
  # Macros:
13
  # ==============================================================================
14
  CHECKPOINT_PATH = \
15
+ 'gs://nb-t5x-us-central2/finetuned/v2_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000'
16
  DROPOUT_RATE = 0.0
17
  EVAL_OUTPUT_DIR = './log/'
18
  LABEL_SMOOTHING = 0.0
19
  LOSS_NORMALIZING_FACTOR = None
20
+ MIXTURE_OR_TASK_NAME = 'sentiment'
21
  MODEL = @models.EncoderDecoderModel()
22
  OPTIMIZER = @adafactor.Adafactor()
23
+ SPLIT = 'test'
24
  VOCABULARY = @seqio.SentencePieceVocabulary()
25
  Z_LOSS = 0.0001
26
 
log/eval_results_t1v-n-7b23714e-w-0.jsonl CHANGED
@@ -3,3 +3,17 @@
3
  {"model": "gs://nb-t5x-us-central2/finetuned/norwegian_NCC_pluss_english_1_500_000/checkpoint_1510000", "task": "categorise", "eval_date": "11-04-2022 07:49:05", "split": "validation", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 86.5, "f1_macro": 86.49816224986179}}
4
  {"model": "gs://nb-t5x-us-central2/finetuned/norwegian_NCC_pluss_english_1_500_000/checkpoint_1510000", "task": "categorise", "eval_date": "11-04-2022 07:51:08", "split": "test", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 85.25, "f1_macro": 85.2425290303216}}
5
  {"model": "gs://nb-t5x-us-central2/finetuned/norwegian_NCC_pluss_english_1_500_000/checkpoint_1505000", "task": "categorise", "eval_date": "11-04-2022 08:13:36", "split": "validation", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 85.25, "f1_macro": 85.24014985000407}}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  {"model": "gs://nb-t5x-us-central2/finetuned/norwegian_NCC_pluss_english_1_500_000/checkpoint_1510000", "task": "categorise", "eval_date": "11-04-2022 07:49:05", "split": "validation", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 86.5, "f1_macro": 86.49816224986179}}
4
  {"model": "gs://nb-t5x-us-central2/finetuned/norwegian_NCC_pluss_english_1_500_000/checkpoint_1510000", "task": "categorise", "eval_date": "11-04-2022 07:51:08", "split": "test", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 85.25, "f1_macro": 85.2425290303216}}
5
  {"model": "gs://nb-t5x-us-central2/finetuned/norwegian_NCC_pluss_english_1_500_000/checkpoint_1505000", "task": "categorise", "eval_date": "11-04-2022 08:13:36", "split": "validation", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 85.25, "f1_macro": 85.24014985000407}}
6
+ {"model": "gs://nb-t5x-us-central2/finetuned/v3_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "parliament", "eval_date": "13-04-2022 13:13:47", "split": "validation", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 51.74999999999999, "f1_macro": 51.71777832289466}}
7
+ {"model": "gs://nb-t5x-us-central2/finetuned/v4_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "parliament", "eval_date": "13-04-2022 13:15:07", "split": "validation", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 50.83333333333333, "f1_macro": 50.79383171490447}}
8
+ {"model": "gs://nb-t5x-us-central2/finetuned/v5_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "parliament", "eval_date": "13-04-2022 13:16:13", "split": "validation", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 51.583333333333336, "f1_macro": 51.03489009889238}}
9
+ {"model": "gs://nb-t5x-us-central2/finetuned/v1_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "parliament", "eval_date": "13-04-2022 13:17:21", "split": "test", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 52.25, "f1_macro": 52.24253789654634}}
10
+ {"model": "gs://nb-t5x-us-central2/finetuned/v3_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "parliament", "eval_date": "13-04-2022 13:19:04", "split": "test", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 52.0, "f1_macro": 51.92307692307692}}
11
+ {"model": "gs://nb-t5x-us-central2/finetuned/v4_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "parliament", "eval_date": "13-04-2022 13:20:24", "split": "test", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 51.583333333333336, "f1_macro": 51.555040131076545}}
12
+ {"model": "gs://nb-t5x-us-central2/finetuned/v5_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "parliament", "eval_date": "13-04-2022 13:21:38", "split": "test", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 50.74999999999999, "f1_macro": 50.43938573350337}}
13
+ {"model": "gs://nb-t5x-us-central2/finetuned/v1_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "sentiment", "eval_date": "13-04-2022 13:51:56", "split": "validation", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 84.88372093023256, "f1_macro": 82.33497191011236}}
14
+ {"model": "gs://nb-t5x-us-central2/finetuned/v3_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "sentiment", "eval_date": "13-04-2022 13:53:25", "split": "validation", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 85.07751937984496, "f1_macro": 82.7653067863882}}
15
+ {"model": "gs://nb-t5x-us-central2/finetuned/v4_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "sentiment", "eval_date": "13-04-2022 13:54:36", "split": "validation", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 85.85271317829456, "f1_macro": 83.60657164617561}}
16
+ {"model": "gs://nb-t5x-us-central2/finetuned/v1_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "sentiment", "eval_date": "13-04-2022 14:01:28", "split": "test", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 87.29016786570743, "f1_macro": 84.21729163839953}}
17
+ {"model": "gs://nb-t5x-us-central2/finetuned/v3_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "sentiment", "eval_date": "13-04-2022 14:03:06", "split": "test", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 84.89208633093526, "f1_macro": 81.23942213621073}}
18
+ {"model": "gs://nb-t5x-us-central2/finetuned/v4_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "sentiment", "eval_date": "13-04-2022 14:04:20", "split": "test", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 85.61151079136691, "f1_macro": 82.17948717948718}}
19
+ {"model": "gs://nb-t5x-us-central2/finetuned/v5_norwegian_NCC_plus_English_t5x_base_1_500_000_sentiment/checkpoint_1510000", "task": "sentiment", "eval_date": "13-04-2022 14:05:39", "split": "test", "feature_length": {"inputs": 512, "targets": 2}, "eval_batch_size": 16, "result": {"accuracy": 80.0959232613909, "f1_macro": 74.5979905029614}}
log/sentiment-metrics.jsonl ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {"step": 1501000, "accuracy": 71.12403100775194, "f1_macro": 51.34385976014934}
2
+ {"step": 1502000, "accuracy": 85.65891472868216, "f1_macro": 83.4095135473331}
3
+ {"step": 1503000, "accuracy": 85.65891472868216, "f1_macro": 83.24087078651685}
4
+ {"step": 1504000, "accuracy": 85.65891472868216, "f1_macro": 83.4095135473331}
5
+ {"step": 1505000, "accuracy": 86.04651162790698, "f1_macro": 83.57966197581501}
6
+ {"step": 1506000, "accuracy": 85.85271317829456, "f1_macro": 83.60657164617561}
7
+ {"step": 1507000, "accuracy": 85.27131782945736, "f1_macro": 82.90437329985352}
8
+ {"step": 1508000, "accuracy": 85.46511627906976, "f1_macro": 83.10095324597064}
9
+ {"step": 1509000, "accuracy": 84.88372093023256, "f1_macro": 82.5127304958376}
10
+ {"step": 1510000, "accuracy": 85.27131782945736, "f1_macro": 82.72818561386819}