pere committed on
Commit
f0adc7d
1 Parent(s): ece75fb

failed script

Browse files
events.out.tfevents.1626538069.t1v-n-4e27a527-w-0.76098.3.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:367d20009fec797ec8f588fa9bee718bf9c3cf3c0607dd97627eeaa4f8e9dfff
3
+ size 40
run.sh CHANGED
@@ -1,17 +1,16 @@
1
  python run_clm_mp.py \
2
  --model_name_or_path /mnt/disks/flaxdisk/norwegian-gptneo-red/ \
3
- --tokenizer_name /mnt/disks/flaxdisk/norwegian-gptneo-red/ \
4
- --train_file /mnt/disks/flaxdisk/corpus/social_train.json \
5
- --validation_file /mnt/disks/flaxdisk/corpus/social_validation.json \
6
  --do_train \
7
  --do_eval \
8
  --block_size 1024 \
9
- --num_train_epochs 10 \
10
  --learning_rate 4e-6 \
11
  --per_device_train_batch_size 3 \
12
  --per_device_eval_batch_size 3 \
13
  --overwrite_output_dir \
14
- --output_dir /mnt/disks/flaxdisk/norwegian-gptneo-red \
15
  --cache_dir /mnt/disks/flaxdisk/cache/ \
16
  --dtype bfloat16 \
17
  --logging_steps 97 \
 
1
  python run_clm_mp.py \
2
  --model_name_or_path /mnt/disks/flaxdisk/norwegian-gptneo-red/ \
3
+ --tokenizer_name gpt2 \
4
+ --dataset_name wikitext --dataset_config_name wikitext-2-raw-v1 \
 
5
  --do_train \
6
  --do_eval \
7
  --block_size 1024 \
8
+ --num_train_epochs 5 \
9
  --learning_rate 4e-6 \
10
  --per_device_train_batch_size 3 \
11
  --per_device_eval_batch_size 3 \
12
  --overwrite_output_dir \
13
+ --output_dir /mnt/disks/flaxdisk/output/ \
14
  --cache_dir /mnt/disks/flaxdisk/cache/ \
15
  --dtype bfloat16 \
16
  --logging_steps 97 \
run_bak.sh ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ python run_clm_mp.py \
2
+ --model_name_or_path /mnt/disks/flaxdisk/norwegian-gptneo-red/ \
3
+ --tokenizer_name /mnt/disks/flaxdisk/norwegian-gptneo-red/ \
4
+ --train_file /mnt/disks/flaxdisk/corpus/social_train.json \
5
+ --validation_file /mnt/disks/flaxdisk/corpus/social_validation.json \
6
+ --do_train \
7
+ --do_eval \
8
+ --block_size 1024 \
9
+ --num_train_epochs 5 \
10
+ --learning_rate 4e-6 \
11
+ --per_device_train_batch_size 3 \
12
+ --per_device_eval_batch_size 3 \
13
+ --overwrite_output_dir \
14
+ --output_dir /mnt/disks/flaxdisk/output/ \
15
+ --cache_dir /mnt/disks/flaxdisk/cache/ \
16
+ --dtype bfloat16 \
17
+ --logging_steps 97 \
18
+ --eval_steps 96\
19
+ --push_to_hub
run_bak2.sh ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ python run_clm_mp.py \
2
+ --model_name_or_path /mnt/disks/flaxdisk/norwegian-gptneo-red/ \
3
+ --tokenizer_name gpt2 \
4
+ --dataset_name wikitext --dataset_config_name wikitext-2-raw-v1 \
5
+ #--train_file /mnt/disks/flaxdisk/corpus/social_train.json \
6
+ #--validation_file /mnt/disks/flaxdisk/corpus/social_validation.json \
7
+ --do_train \
8
+ --do_eval \
9
+ --block_size 1024 \
10
+ --num_train_epochs 5 \
11
+ --learning_rate 4e-6 \
12
+ --per_device_train_batch_size 3 \
13
+ --per_device_eval_batch_size 3 \
14
+ --overwrite_output_dir \
15
+ --output_dir /mnt/disks/flaxdisk/output/ \
16
+ --cache_dir /mnt/disks/flaxdisk/cache/ \
17
+ --dtype bfloat16 \
18
+ --logging_steps 97 \
19
+ --eval_steps 96\
20
+ --push_to_hub