SLM_vs_LLM_experiments
/
max_seq_length_128_experiments
/Qwen
/Qwen1.5_1.8B_twitter
/eval_results.json
{ | |
"epoch": 3.0, | |
"eval_accuracy": 0.7775735294117647, | |
"eval_f1_macro": 0.7420002194942226, | |
"eval_f1_micro": 0.7775735294117647, | |
"eval_loss": 0.5038631558418274, | |
"eval_runtime": 2.7898, | |
"eval_samples": 1088, | |
"eval_samples_per_second": 389.992, | |
"eval_steps_per_second": 12.187 | |
} |