- adaptive_span
- backtranslation
- bart
- byte_level_bpe
- camembert
- constrained_decoding
- conv_seq2seq
- criss
- cross_lingual_language_model
- discriminative_reranking_nmt
- fast_noisy_channel
- flores101
- fully_sharded_data_parallel
- gottbert
- hubert
- joint_alignment_translation
- language_model
- laser
- latent_depth
- layerdrop
- linformer
- m2m_100
- mbart
- megatron_11b
- multilingual
- noisychannel
- nonautoregressive_translation
- paraphraser
- pay_less_attention_paper
- pointer_generator
- quant_noise
- roberta
- rxf
- scaling_nmt
- shuffled_word_order
- simultaneous_translation
- speech_recognition
- speech_synthesis
- speech_text_joint_to_text
- speech_to_text
- stories
- textless_nlp
- translation
- translation_moe
- truncated_bptt
- unsupervised_quality_estimation
- wav2vec
- wmt19
- wmt20
- xlmr