{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "be1c7379", "metadata": {}, "outputs": [], "source": [ "# Install the notebook's dependencies.\n", "# %pip (rather than !pip) installs into the environment of the running kernel,\n", "# not into whichever pip happens to be first on the shell PATH.\n", "%pip install --quiet --root-user-action=ignore --upgrade pip\n", "%pip install --quiet --root-user-action=ignore \"datasets>=1.18.3\" librosa jiwer huggingface_hub\n", "# kenlm is installed from the upstream GitHub master archive (unpinned).\n", "%pip install --quiet --root-user-action=ignore https://github.com/kpu/kenlm/archive/master.zip pyctcdecode\n", "# transformers is installed at its latest release. An earlier \"transformers==4.11.3\" pin was\n", "# dropped because this --upgrade always replaced it, so the pin only added a redundant install.\n", "%pip install --quiet --root-user-action=ignore --upgrade transformers\n", "%pip install --quiet --root-user-action=ignore torch_audiomentations audiomentations" ] }, { "cell_type": "code", "execution_count": 2, "id": "8892305a", "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "Reusing dataset common_voice (/ai_data/cache/common_voice/de/6.1.0/a1dc74461f6c839bfe1e8cf1262fd4cf24297e3fbd4087a711bd090779023a5e)\n", "Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.\n" ] }, { "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "efc316d6eedb4dcab341dfd0fe8cc926", "version_major": 2, "version_minor": 0 }, "text/plain": [ " 0%| | 0/15588 [00:00