{ "data": [ { "wav": "path_to_audio_file", "caption": "textual_descriptions" } ] }