---
license: openrail
datasets:
- HuggingFaceFW/fineweb
- PleIAs/YouTube-Commons
- HuggingFaceM4/the_cauldron
- Anthropic/persuasion
- allenai/WildChat-1M
- mlabonne/orpo-dpo-mix-40k
- m-a-p/COIG-CQIA
- gretelai/synthetic_text_to_sql
- PleIAs/Post-OCR-Correction
- LooksJuicy/ruozhiba
language:
- pt
metrics:
- character
- accuracy
- bertscore
- bleu
- bleurt
- brier_score
- cer
- charcut_mt
- chrf
- code_eval
library_name: espnet
pipeline_tag: audio-to-audio
tags:
- legal
- chemistry
- finance
- biology
- music
- code
---