File size: 1,344 Bytes
eea2579
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
{
    "before_init_mem_cpu": 3802071040,
    "before_init_mem_gpu": 22016,
    "epoch": 0.9807355516637478,
    "eval_logits/chosen": -12.004097938537598,
    "eval_logits/rejected": -17.047502517700195,
    "eval_logps/chosen": -2.168222427368164,
    "eval_logps/rejected": -4.787535667419434,
    "eval_loss": 1.0162526369094849,
    "eval_mem_cpu_alloc_delta": 466944,
    "eval_mem_cpu_peaked_delta": 0,
    "eval_mem_gpu_alloc_delta": 0,
    "eval_mem_gpu_peaked_delta": 25220711424,
    "eval_rewards/accuracies": 0.9166666865348816,
    "eval_rewards/chosen": -21.682226181030273,
    "eval_rewards/margins": 26.193130493164062,
    "eval_rewards/rejected": -47.875362396240234,
    "eval_runtime": 9.9413,
    "eval_samples_per_second": 9.456,
    "eval_sft_loss": 0.01844729855656624,
    "eval_steps_per_second": 1.207,
    "init_mem_cpu_alloc_delta": 364544,
    "init_mem_cpu_peaked_delta": 0,
    "init_mem_gpu_alloc_delta": 0,
    "init_mem_gpu_peaked_delta": 0,
    "total_flos": 39867492466688.0,
    "train_loss": 3.085822834287371,
    "train_mem_cpu_alloc_delta": 5213659136,
    "train_mem_cpu_peaked_delta": 22737326080,
    "train_mem_gpu_alloc_delta": 16267848704,
    "train_mem_gpu_peaked_delta": 36029468160,
    "train_runtime": 1628.7465,
    "train_samples_per_second": 2.805,
    "train_steps_per_second": 0.021
}