Jerry Ji committed on
Commit
2584321
·
1 Parent(s): 9d693d7

Training in progress, epoch 0

Browse files
adapter_config.json CHANGED
@@ -16,10 +16,10 @@
16
  "rank_pattern": {},
17
  "revision": null,
18
  "target_modules": [
19
- "o_proj",
20
- "q_proj",
21
  "v_proj",
22
- "k_proj"
 
 
23
  ],
24
  "task_type": "CAUSAL_LM"
25
  }
 
16
  "rank_pattern": {},
17
  "revision": null,
18
  "target_modules": [
 
 
19
  "v_proj",
20
+ "q_proj",
21
+ "k_proj",
22
+ "o_proj"
23
  ],
24
  "task_type": "CAUSAL_LM"
25
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3fcd987e4295cf39204d499f3d64718c79f91cd5edcd56838915d9b76fbfe4dc
3
  size 218138576
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b406044886581aee396c928a6e0154eb09cc26550ff19e5930abfb44a682b43b
3
  size 218138576
all_results.json CHANGED
@@ -1,21 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "eval_logits/chosen": -3.0078587532043457,
4
- "eval_logits/rejected": -3.042999744415283,
5
- "eval_logps/chosen": -194.36697387695312,
6
- "eval_logps/rejected": -179.82501220703125,
7
- "eval_loss": 0.6931471824645996,
8
- "eval_rewards/accuracies": 0.0,
9
- "eval_rewards/chosen": 0.0,
10
- "eval_rewards/margins": 0.0,
11
- "eval_rewards/rejected": 0.0,
12
- "eval_runtime": 5.0964,
13
- "eval_samples": 10,
14
- "eval_samples_per_second": 1.962,
15
- "eval_steps_per_second": 0.392,
16
- "train_loss": 0.3465735912322998,
17
- "train_runtime": 16.8017,
18
  "train_samples": 61966,
19
- "train_samples_per_second": 0.595,
20
- "train_steps_per_second": 0.06
21
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 19.057324022054672,
4
+ "train_runtime": 626.0842,
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "train_samples": 61966,
6
+ "train_samples_per_second": 0.799,
7
+ "train_steps_per_second": 0.026
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 0.3465735912322998,
4
- "train_runtime": 16.8017,
5
  "train_samples": 61966,
6
- "train_samples_per_second": 0.595,
7
- "train_steps_per_second": 0.06
8
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 19.057324022054672,
4
+ "train_runtime": 626.0842,
5
  "train_samples": 61966,
6
+ "train_samples_per_second": 0.799,
7
+ "train_steps_per_second": 0.026
8
  }
trainer_state.json CHANGED
@@ -3,53 +3,67 @@
3
  "best_model_checkpoint": null,
4
  "epoch": 1.0,
5
  "eval_steps": 100,
6
- "global_step": 1,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 1.0,
13
- "learning_rate": 0.0,
14
- "logits/chosen": -3.053490400314331,
15
- "logits/rejected": -3.094686985015869,
16
- "logps/chosen": -181.32530212402344,
17
- "logps/rejected": -175.11618041992188,
18
- "loss": 0.3466,
19
  "rewards/accuracies": 0.0,
20
  "rewards/chosen": 0.0,
21
  "rewards/margins": 0.0,
22
  "rewards/rejected": 0.0,
23
  "step": 1
24
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  {
26
  "epoch": 1.0,
27
- "eval_logits/chosen": -3.0078587532043457,
28
- "eval_logits/rejected": -3.042999744415283,
29
- "eval_logps/chosen": -194.36697387695312,
30
- "eval_logps/rejected": -179.82501220703125,
31
- "eval_loss": 0.6931471824645996,
32
- "eval_rewards/accuracies": 0.0,
33
- "eval_rewards/chosen": 0.0,
34
- "eval_rewards/margins": 0.0,
35
- "eval_rewards/rejected": 0.0,
36
- "eval_runtime": 5.1666,
37
- "eval_samples_per_second": 1.936,
38
- "eval_steps_per_second": 0.387,
39
- "step": 1
40
  },
41
  {
42
  "epoch": 1.0,
43
- "step": 1,
44
  "total_flos": 0.0,
45
- "train_loss": 0.3465735912322998,
46
- "train_runtime": 16.8017,
47
- "train_samples_per_second": 0.595,
48
- "train_steps_per_second": 0.06
49
  }
50
  ],
51
  "logging_steps": 10,
52
- "max_steps": 1,
53
  "num_train_epochs": 1,
54
  "save_steps": 500,
55
  "total_flos": 0.0,
 
3
  "best_model_checkpoint": null,
4
  "epoch": 1.0,
5
  "eval_steps": 100,
6
+ "global_step": 16,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.06,
13
+ "learning_rate": 0.00025,
14
+ "logits/chosen": -3.027029514312744,
15
+ "logits/rejected": -3.115102767944336,
16
+ "logps/chosen": -313.0743103027344,
17
+ "logps/rejected": -258.258544921875,
18
+ "loss": 0.6931,
19
  "rewards/accuracies": 0.0,
20
  "rewards/chosen": 0.0,
21
  "rewards/margins": 0.0,
22
  "rewards/rejected": 0.0,
23
  "step": 1
24
  },
25
+ {
26
+ "epoch": 0.62,
27
+ "learning_rate": 0.00021428571428571427,
28
+ "logits/chosen": -2.8371262550354004,
29
+ "logits/rejected": -2.8233795166015625,
30
+ "logps/chosen": -797.5036010742188,
31
+ "logps/rejected": -571.7381591796875,
32
+ "loss": 25.7534,
33
+ "rewards/accuracies": 0.3819444477558136,
34
+ "rewards/chosen": -54.44696807861328,
35
+ "rewards/margins": -20.015228271484375,
36
+ "rewards/rejected": -34.43173599243164,
37
+ "step": 10
38
+ },
39
  {
40
  "epoch": 1.0,
41
+ "eval_logits/chosen": -3.1348018646240234,
42
+ "eval_logits/rejected": -3.0953807830810547,
43
+ "eval_logps/chosen": -279.9947509765625,
44
+ "eval_logps/rejected": -279.706787109375,
45
+ "eval_loss": 0.947689950466156,
46
+ "eval_rewards/accuracies": 0.6944444179534912,
47
+ "eval_rewards/chosen": -3.136577844619751,
48
+ "eval_rewards/margins": 2.351809501647949,
49
+ "eval_rewards/rejected": -5.488387107849121,
50
+ "eval_runtime": 198.8798,
51
+ "eval_samples_per_second": 2.514,
52
+ "eval_steps_per_second": 0.317,
53
+ "step": 16
54
  },
55
  {
56
  "epoch": 1.0,
57
+ "step": 16,
58
  "total_flos": 0.0,
59
+ "train_loss": 19.057324022054672,
60
+ "train_runtime": 626.0842,
61
+ "train_samples_per_second": 0.799,
62
+ "train_steps_per_second": 0.026
63
  }
64
  ],
65
  "logging_steps": 10,
66
+ "max_steps": 16,
67
  "num_train_epochs": 1,
68
  "save_steps": 500,
69
  "total_flos": 0.0,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1822fa9c0a896388f17c4a6fafc12ec68e5d9a0b52d64a949b92685ec29039db
3
  size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70f9924616298b428922bcac8ef53f857cc390c4cc29b39f72d9ef1110712bfd
3
  size 4792