{ "epoch": 7.917525773195877, "eval_audio_cosine_sim": 0.5579971075057983, "eval_loss": 3.0988662242889404, "eval_runtime": 2019.3746, "eval_samples": 12, "eval_samples_per_second": 0.006, "eval_steps_per_second": 0.006, "eval_text_cosine_sim": 0.3821232318878174, "total_flos": 962957869218000.0, "train_loss": 8.716416617234549, "train_runtime": 7439.5895, "train_samples": 97, "train_samples_per_second": 0.104, "train_steps_per_second": 0.006 }