SLM_vs_LLM_experiments
/
max_seq_length_128_experiments
/Qwen
/Qwen1.5_1.8B_amazon
/train_results.json
{ | |
"epoch": 1.0, | |
"train_loss": 1.0740083393297697, | |
"train_runtime": 415.974, | |
"train_samples": 12144, | |
"train_samples_per_second": 29.194, | |
"train_steps_per_second": 0.914 | |
} |