---
license: apache-2.0
datasets:
- HuggingFaceFW/fineweb
- m-a-p/COIG-CQIA
- gretelai/synthetic_text_to_sql
- PleIAs/YouTube-Commons
- HuggingFaceM4/the_cauldron
- Anthropic/persuasion
- mlabonne/orpo-dpo-mix-40k
- pixparse/idl-wds
- HuggingFaceTB/cosmopedia
- pixparse/pdfa-eng-wds
language:
- aa
- ae
metrics:
- accuracy
- bertscore
- bleu
- bleurt
- brier_score
- cer
- character
- charcut_mt
- chrf
- code_eval
library_name: fasttext
pipeline_tag: text-classification
tags:
- finance
- not-for-all-audiences
- legal
---