inflaton committed on
Commit
a36def6
·
1 Parent(s): ceb9311
data/Qwen2.5-3B-Instruct_results.csv CHANGED
The diff for this file is too large to render. See raw diff
 
data/Qwen2.5-7B-Instruct_results.csv ADDED
The diff for this file is too large to render. See raw diff
 
llama-factory/config/models/Qwen2.5-72B-Instruct.yaml ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ### model
2
+ model_name_or_path: Qwen/Qwen2.5-72B-Instruct
3
+ quantization_bit: 4
4
+
5
+ ### method
6
+ stage: sft
7
+ do_train: true
8
+ finetuning_type: lora
9
+ lora_target: all
10
+
11
+ ### dataset
12
+ dataset: alpaca_mgtv_p2
13
+ template: qwen
14
+ cutoff_len: 8192
15
+ max_samples: 25000
16
+ overwrite_cache: true
17
+ preprocessing_num_workers: 16
18
+
19
+ ### output
20
+ output_dir: saves/Qwen2.5-72B-Instruct
21
+ logging_steps: 5
22
+ save_steps: 35
23
+ plot_loss: true
24
+ # overwrite_output_dir: true
25
+
26
+ ### train
27
+ per_device_train_batch_size: 16
28
+ gradient_accumulation_steps: 8
29
+ learning_rate: 1.0e-4
30
+ num_train_epochs: 2.0
31
+ lr_scheduler_type: cosine
32
+ warmup_ratio: 0.1
33
+ bf16: true
34
+ ddp_timeout: 180000000
35
+
36
+ ### eval
37
+ val_size: 0.1
38
+ per_device_eval_batch_size: 1
39
+ eval_strategy: steps
40
+ eval_steps: 35
41
+
42
+ report_to: wandb
43
+ run_name: Qwen2.5-72B-Instruct_lora_sft
logs/Qwen2.5-7B-Instruct_epoch_1.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3eb21a1e6bba7f6b3162293b01cdf4f80e81044342a1afc90cef71d87cca1d04
3
+ size 17547
logs/Qwen2.5-7B-Instruct_epoch_10.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c18b323927342384b5c2916642be7100cd68558b01afddc576a89f26b5574a38
3
+ size 17397
logs/Qwen2.5-7B-Instruct_epoch_2.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d679717eeb115236b3dbd71be9c0889d7089433d81007032d2c8bc03759fcdc8
3
+ size 17597
logs/Qwen2.5-7B-Instruct_epoch_3.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8190376a1eed3d4cc0fa2304daf6b5905ca4875a0c989085113de79c49a50ec
3
+ size 17490
logs/Qwen2.5-7B-Instruct_epoch_4.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28c5cfd7853d62cacd618ae27fbb9acb453ac02af0eef1b5d618abb8bdbc6cac
3
+ size 17473
logs/Qwen2.5-7B-Instruct_epoch_5.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e79deb7310a05eb990f0ab88ef28dbe5fbbaab6de5932f95734266889f750cf6
3
+ size 17122
logs/Qwen2.5-7B-Instruct_epoch_6.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbb92e8dc536224b47d905ffc52851bbfcab8e73702461a51a46f8a985158129
3
+ size 17600
logs/Qwen2.5-7B-Instruct_epoch_7.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34aa91ae94e34308c1bcc116cf77da85f053df27f5660cca32aa0f9c2869b9ce
3
+ size 17537
logs/Qwen2.5-7B-Instruct_epoch_8.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a61e5ccb7a9ae5f2b8e34680783e080f67a11062bcb50f1c6fc99efd226694f
3
+ size 17416
logs/Qwen2.5-7B-Instruct_epoch_9.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c79c85037b52efc95d14b735cb70bae41350275c74da60656d21b661bb01411
3
+ size 17418
scripts/eval-mgtv-qwen2.5.sh CHANGED
@@ -13,13 +13,13 @@ cat /etc/os-release
13
  lscpu
14
  grep MemTotal /proc/meminfo
15
 
 
16
  $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-7B-Instruct
17
 
18
- $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-7B-Instruct
19
 
20
  # $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-3B-Instruct
21
 
22
- $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-3B-Instruct
23
 
24
  # $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-1.5B-Instruct
25
 
 
13
  lscpu
14
  grep MemTotal /proc/meminfo
15
 
16
+ $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-7B-Instruct
17
  $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-7B-Instruct
18
 
 
19
 
20
  # $BASEDIR/scripts/eval-shots.sh Qwen Qwen2.5-3B-Instruct
21
 
22
+ #$BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-3B-Instruct
23
 
24
  # $BASEDIR/scripts/eval-epochs.sh Qwen Qwen2.5-1.5B-Instruct
25
 
scripts/eval-mgtv.sh CHANGED
@@ -1 +1 @@
1
- eval-mgtv-shots_4bit.sh
 
1
+ eval-mgtv-qwen2.5.sh