llama3 epoch 6 shows promising results; adding 4 epochs
Files changed:

- competition/00a_InternLM_2.5_Results.ipynb (+0 -0)
- competition/11_Llama-3_8b_analysis.ipynb (+0 -0)
- competition/11a_Llama-3_8b_p2_analysis.ipynb (+0 -0)
- llama-factory/config/llama3-8b_lora_sft_bf16-p1.yaml (+2 -2)
- llama-factory/config/llama3-8b_lora_sft_bf16-p2.yaml (+1 -1)
- results/mgtv-llama3_p1_full_metrics.csv (+6 -2)
- results/mgtv-llama3_p2_full_metrics.csv (+6 -3)
- scripts/eval-mgtv-llama3_8b.sh (+1 -1)
competition/00a_InternLM_2.5_Results.ipynb (CHANGED)

The diff for this notebook is too large to render; see the raw diff.

competition/11_Llama-3_8b_analysis.ipynb (CHANGED)

The diff for this notebook is too large to render; see the raw diff.

competition/11a_Llama-3_8b_p2_analysis.ipynb (CHANGED)

The diff for this notebook is too large to render; see the raw diff.
llama-factory/config/llama3-8b_lora_sft_bf16-p1.yaml (CHANGED)

@@ -25,13 +25,13 @@ output_dir: saves/llama3-8b/lora/sft_bf16_p1_full
 logging_steps: 10
 save_steps: 175
 plot_loss: true
-overwrite_output_dir: true
+# overwrite_output_dir: true

 ### train
 per_device_train_batch_size: 16
 gradient_accumulation_steps: 8
 learning_rate: 1.0e-4
-num_train_epochs: 6.0
+num_train_epochs: 10.0
 lr_scheduler_type: cosine
 warmup_ratio: 0.1
 bf16: true
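A quick sanity check on the schedule this change implies, assuming the checkpoint-to-epoch mapping suggested by the metrics CSVs below (checkpoint-175 through checkpoint-1050 scored as epochs 1 through 6, i.e. save_steps lands on epoch boundaries). Commenting out overwrite_output_dir presumably lets the extended run keep the checkpoints already in output_dir rather than clobbering them. The numbers here are inferences, not values stated in the repo:

# Effective batch and epoch arithmetic implied by this config. The per-epoch
# sample count is an inference from save_steps lining up with epoch
# boundaries (and assumes a single GPU); it is not stated anywhere in the repo.
per_device_train_batch_size = 16
gradient_accumulation_steps = 8
save_steps = 175  # one checkpoint per epoch, per the metrics CSVs

effective_batch = per_device_train_batch_size * gradient_accumulation_steps
print(effective_batch)               # 128 samples per optimizer step
print(save_steps * effective_batch)  # ~22,400 training samples per epoch
print(10 * save_steps)               # the 10-epoch run should end near checkpoint-1750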
llama-factory/config/llama3-8b_lora_sft_bf16-p2.yaml (CHANGED)

@@ -31,7 +31,7 @@ plot_loss: true
 per_device_train_batch_size: 16
 gradient_accumulation_steps: 8
 learning_rate: 1.0e-4
-num_train_epochs: 6.0
+num_train_epochs: 10.0
 lr_scheduler_type: cosine
 warmup_ratio: 0.1
 bf16: true
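The p2 config gets the same bump from 6 to 10 epochs. Both files are LLaMA-Factory training configs; assuming the repo uses that project's standard entry point, a run would be launched with something like `llamafactory-cli train llama-factory/config/llama3-8b_lora_sft_bf16-p2.yaml` (the launch command itself is not part of this diff).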
results/mgtv-llama3_p1_full_metrics.csv (CHANGED)

@@ -1,4 +1,8 @@
 epoch,model,accuracy,precision,recall,f1
 0,shenzhi-wang/Llama3-8B-Chinese-Chat,0.7836666666666666,0.7667122897184859,0.7929173693086004,0.7679400621793133
-1,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-175,0.
-2,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-350,0.
+1,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-175,0.292,0.7244497001864332,0.292,0.39603584197818525
+2,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-350,0.314,0.8230975844189062,0.314,0.44460745309834776
+3,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-525,,,,
+4,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-700,0.0,0.0,0.0,0.0
+5,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-875,,,,
+6,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-1050,0.5506666666666666,0.7209974218469999,0.5506666666666666,0.6017622173499129
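Two patterns in these rows are worth noting: accuracy equals recall in every populated row, which is the signature of weighted-average recall on a multiclass task, and the empty rows (epochs 3 and 5) along with the all-zero epoch 4 row look like evaluations that failed or had not completed by commit time. A minimal sketch of how such rows could be produced, assuming scikit-learn's weighted averaging; y_true and y_pred are hypothetical stand-ins:

# Minimal sketch of producing one metrics row, assuming scikit-learn with
# average="weighted". With weighted averaging, recall reduces to overall
# accuracy, matching the accuracy == recall pattern in every populated row.
from sklearn.metrics import accuracy_score, precision_recall_fscore_support

y_true = ["A", "B", "B", "C"]  # hypothetical gold labels
y_pred = ["A", "B", "C", "C"]  # hypothetical model outputs

accuracy = accuracy_score(y_true, y_pred)
precision, recall, f1, _ = precision_recall_fscore_support(
    y_true, y_pred, average="weighted", zero_division=0
)
print(f"{accuracy},{precision},{recall},{f1}")  # recall == accuracy, as in the CSV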
results/mgtv-llama3_p2_full_metrics.csv (CHANGED)

@@ -1,5 +1,8 @@
 epoch,model,accuracy,precision,recall,f1
 0,shenzhi-wang/Llama3-8B-Chinese-Chat,0.73,0.7709739363586101,0.73,0.7462914191370829
-1,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-175
-2,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-350
-3,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-525
+1,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-175,,,,
+2,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-350,,,,
+3,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-525,,,,
+4,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-700,,,,
+5,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-875,,,,
+6,shenzhi-wang/Llama3-8B-Chinese-Chat_checkpoint-1050,0.6656666666666666,0.7924121951113166,0.6656666666666666,0.7124311215236507
scripts/eval-mgtv-llama3_8b.sh (CHANGED)

@@ -18,7 +18,7 @@ grep MemTotal /proc/meminfo

 export LOGICAL_REASONING_DATA_PATH=datasets/mgtv
 export RESIZE_TOKEN_EMBEDDINGS=true
-export START_EPOCH=
+export START_EPOCH=7

 #export MODEL_NAME=FlagAlpha/Llama3-Chinese-8B-Instruct
 export MODEL_NAME=shenzhi-wang/Llama3-8B-Chinese-Chat
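START_EPOCH moves to 7 so evaluation resumes where the six scored epochs left off, once the extended training run produces checkpoints 1225 through 1750. A hypothetical reconstruction of how the eval loop might consume the variable; the epoch-to-step mapping (epoch * 175) follows the checkpoint names in the metrics CSVs, but the directory layout and loop structure are assumptions:

# Hypothetical sketch: resume checkpoint evaluation at START_EPOCH. The
# epoch-to-step mapping matches the checkpoint names in the metrics CSVs;
# output_dir comes from the p1 config's hunk header. The loop itself is an
# assumption, not code from the repo.
import os

start_epoch = int(os.environ.get("START_EPOCH", "1"))
num_train_epochs = 10
save_steps = 175
output_dir = "saves/llama3-8b/lora/sft_bf16_p1_full"

for epoch in range(start_epoch, num_train_epochs + 1):
    checkpoint = f"{output_dir}/checkpoint-{epoch * save_steps}"
    print(f"epoch {epoch}: evaluate adapter at {checkpoint}")
    # ... run inference, score, and append a row to the full_metrics CSV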