{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [] }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" }, "widgets": { "application/vnd.jupyter.widget-state+json": { "9074c90ec0f74bf29bf36d65ebba1b96": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_39038e915d234800bcaaa9b3895f1b68", "IPY_MODEL_6d3b0f9e6c494cbea42456b60b011564", "IPY_MODEL_831274f9a0ec40668ec7fcc5ac2771c3" ], "layout": "IPY_MODEL_8fa5eaaf1c8d4bc18ee076d33d563a0a" } }, "39038e915d234800bcaaa9b3895f1b68": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4a614b527a2a49789d41df08c3466764", "placeholder": "​", "style": "IPY_MODEL_30e7f062bc1b44a3a99363cb1a06fea9", "value": "Loading checkpoint shards:  33%" } }, "6d3b0f9e6c494cbea42456b60b011564": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", 
"description_tooltip": null, "layout": "IPY_MODEL_528eadb5cd604eb78b99b3781ad8a357", "max": 3, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_4f5a0839fd414dbaa5a2f6306cfa5ecc", "value": 1 } }, "831274f9a0ec40668ec7fcc5ac2771c3": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d44816c885194cef98b86893263b9b10", "placeholder": "​", "style": "IPY_MODEL_9c8da3b512bf414684a22b77d7fe48c6", "value": " 1/3 [00:33<01:06, 33.42s/it]" } }, "8fa5eaaf1c8d4bc18ee076d33d563a0a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, 
"4a614b527a2a49789d41df08c3466764": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "30e7f062bc1b44a3a99363cb1a06fea9": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "528eadb5cd604eb78b99b3781ad8a357": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": 
null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "4f5a0839fd414dbaa5a2f6306cfa5ecc": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "d44816c885194cef98b86893263b9b10": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": 
null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "9c8da3b512bf414684a22b77d7fe48c6": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } } } } }, "cells": [ { "cell_type": "markdown", "source": [ "

OLMoE-1B-7B

" ], "metadata": { "id": "exGk3x7MxVMy" } }, { "cell_type": "markdown", "source": [ "The `transformers` library requires special install steps because the code that supports the OLMoE models was only introduced in this [PR](https://github.com/huggingface/transformers/pull/32406).\n", "That code has not yet been released on PyPI, so we have to install `transformers` from source." ], "metadata": { "id": "t6IQl5rxrZDp" } }, { "cell_type": "code", "source": [ "!git init\n", "!git branch -m main" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "2AziwR7vq2bq", "outputId": "c2d1effa-0a73-420c-fffd-962424a9cefb" }, "execution_count": null, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\u001b[33mhint: Using 'master' as the name for the initial branch. This default branch name\u001b[m\n", "\u001b[33mhint: is subject to change. To configure the initial branch name to use in all\u001b[m\n", "\u001b[33mhint: of your new repositories, which will suppress this warning, call:\u001b[m\n", "\u001b[33mhint: \u001b[m\n", "\u001b[33mhint: \tgit config --global init.defaultBranch \u001b[m\n", "\u001b[33mhint: \u001b[m\n", "\u001b[33mhint: Names commonly chosen instead of 'master' are 'main', 'trunk' and\u001b[m\n", "\u001b[33mhint: 'development'. 
The just-created branch can be renamed via this command:\u001b[m\n", "\u001b[33mhint: \u001b[m\n", "\u001b[33mhint: \tgit branch -m \u001b[m\n", "Initialized empty Git repository in /content/.git/\n" ] } ] }, { "cell_type": "code", "source": [ "!export PR_NUMBER=32406" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "bqhf8TGhxvB9", "outputId": "101d77d0-5957-4534-b9a6-f3c794af86f2" }, "execution_count": 3, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\n" ] } ] }, { "cell_type": "code", "source": [ "!git remote add origin https://github.com/huggingface/transformers.git" ], "metadata": { "id": "PL3UBh06qo_C" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "7bitxdKMptwl", "outputId": "9c5016c2-b7ca-4477-e1f4-c896e5ca6f5a", "collapsed": true }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "remote: Enumerating objects: 188166, done.\u001b[K\n", "remote: Counting objects: 2% (1/47)\u001b[K\rremote: Counting objects: 4% (2/47)\u001b[K\rremote: Counting objects: 6% (3/47)\u001b[K\rremote: Counting objects: 8% (4/47)\u001b[K\rremote: Counting objects: 10% (5/47)\u001b[K\rremote: Counting objects: 12% (6/47)\u001b[K\rremote: Counting objects: 14% (7/47)\u001b[K\rremote: Counting objects: 17% (8/47)\u001b[K\rremote: Counting objects: 19% (9/47)\u001b[K\rremote: Counting objects: 21% (10/47)\u001b[K\rremote: Counting objects: 23% (11/47)\u001b[K\rremote: Counting objects: 25% (12/47)\u001b[K\rremote: Counting objects: 27% (13/47)\u001b[K\rremote: Counting objects: 29% (14/47)\u001b[K\rremote: Counting objects: 31% (15/47)\u001b[K\rremote: Counting objects: 34% (16/47)\u001b[K\rremote: Counting objects: 36% (17/47)\u001b[K\rremote: Counting objects: 38% (18/47)\u001b[K\rremote: Counting objects: 40% (19/47)\u001b[K\rremote: Counting objects: 42% (20/47)\u001b[K\rremote: Counting objects: 
44% (21/47)\u001b[K\rremote: Counting objects: 46% (22/47)\u001b[K\rremote: Counting objects: 48% (23/47)\u001b[K\rremote: Counting objects: 51% (24/47)\u001b[K\rremote: Counting objects: 53% (25/47)\u001b[K\rremote: Counting objects: 55% (26/47)\u001b[K\rremote: Counting objects: 57% (27/47)\u001b[K\rremote: Counting objects: 59% (28/47)\u001b[K\rremote: Counting objects: 61% (29/47)\u001b[K\rremote: Counting objects: 63% (30/47)\u001b[K\rremote: Counting objects: 65% (31/47)\u001b[K\rremote: Counting objects: 68% (32/47)\u001b[K\rremote: Counting objects: 70% (33/47)\u001b[K\rremote: Counting objects: 72% (34/47)\u001b[K\rremote: Counting objects: 74% (35/47)\u001b[K\rremote: Counting objects: 76% (36/47)\u001b[K\rremote: Counting objects: 78% (37/47)\u001b[K\rremote: Counting objects: 80% (38/47)\u001b[K\rremote: Counting objects: 82% (39/47)\u001b[K\rremote: Counting objects: 85% (40/47)\u001b[K\rremote: Counting objects: 87% (41/47)\u001b[K\rremote: Counting objects: 89% (42/47)\u001b[K\rremote: Counting objects: 91% (43/47)\u001b[K\rremote: Counting objects: 93% (44/47)\u001b[K\rremote: Counting objects: 95% (45/47)\u001b[K\rremote: Counting objects: 97% (46/47)\u001b[K\rremote: Counting objects: 100% (47/47)\u001b[K\rremote: Counting objects: 100% (47/47), done.\u001b[K\n", "remote: Compressing objects: 100% (46/46), done.\u001b[K\n", "remote: Total 188166 (delta 1), reused 47 (delta 1), pack-reused 188119 (from 1)\u001b[K\n", "Receiving objects: 100% (188166/188166), 214.64 MiB | 20.89 MiB/s, done.\n", "Resolving deltas: 100% (134665/134665), done.\n", "From https://github.com/huggingface/transformers\n", " * [new ref] refs/pull/32406/head -> pr-32406\n", " * [new tag] 0.1.2 -> 0.1.2\n", " * [new tag] 0.5.0 -> 0.5.0\n", " * [new tag] 1.0 -> 1.0\n", " * [new tag] 1.1.0 -> 1.1.0\n", " * [new tag] 1.2.0 -> 1.2.0\n", " * [new tag] 3.0.1 -> 3.0.1\n", " * [new tag] 4.3.0.rc1 -> 4.3.0.rc1\n", " * [new tag] v0.1.2 -> v0.1.2\n", " * [new tag] v0.2.0 -> v0.2.0\n", " 
* [new tag] v0.3.0 -> v0.3.0\n", " * [new tag] v0.4.0 -> v0.4.0\n", " * [new tag] v0.5.0 -> v0.5.0\n", " * [new tag] v0.5.1 -> v0.5.1\n", " * [new tag] v0.6.0 -> v0.6.0\n", " * [new tag] v0.6.1 -> v0.6.1\n", " * [new tag] v0.6.2 -> v0.6.2\n", " * [new tag] v1.0.0 -> v1.0.0\n", " * [new tag] v2.0.0 -> v2.0.0\n", " * [new tag] v2.1.0 -> v2.1.0\n", " * [new tag] v2.1.1 -> v2.1.1\n", " * [new tag] v2.10.0 -> v2.10.0\n", " * [new tag] v2.11.0 -> v2.11.0\n", " * [new tag] v2.2.0 -> v2.2.0\n", " * [new tag] v2.2.1 -> v2.2.1\n", " * [new tag] v2.2.2 -> v2.2.2\n", " * [new tag] v2.3.0 -> v2.3.0\n", " * [new tag] v2.4.0 -> v2.4.0\n", " * [new tag] v2.4.1 -> v2.4.1\n", " * [new tag] v2.5.0 -> v2.5.0\n", " * [new tag] v2.5.1 -> v2.5.1\n", " * [new tag] v2.6.0 -> v2.6.0\n", " * [new tag] v2.7.0 -> v2.7.0\n", " * [new tag] v2.8.0 -> v2.8.0\n", " * [new tag] v2.9.0 -> v2.9.0\n", " * [new tag] v2.9.1 -> v2.9.1\n", " * [new tag] v3.0.0 -> v3.0.0\n", " * [new tag] v3.0.1 -> v3.0.1\n", " * [new tag] v3.0.2 -> v3.0.2\n", " * [new tag] v3.1.0 -> v3.1.0\n", " * [new tag] v3.2.0 -> v3.2.0\n", " * [new tag] v3.3.0 -> v3.3.0\n", " * [new tag] v3.3.1 -> v3.3.1\n", " * [new tag] v3.4.0 -> v3.4.0\n", " * [new tag] v3.5.0 -> v3.5.0\n", " * [new tag] v4.0.0-rc-1 -> v4.0.0-rc-1\n", " * [new tag] v4.1.0 -> v4.1.0\n", " * [new tag] v4.1.1 -> v4.1.1\n", " * [new tag] v4.10.0 -> v4.10.0\n", " * [new tag] v4.11.0 -> v4.11.0\n", " * [new tag] v4.12.0 -> v4.12.0\n", " * [new tag] v4.13.0 -> v4.13.0\n", " * [new tag] v4.14.0 -> v4.14.0\n", " * [new tag] v4.15.0 -> v4.15.0\n", " * [new tag] v4.16.0 -> v4.16.0\n", " * [new tag] v4.2.0 -> v4.2.0\n", " * [new tag] v4.3.0.rc1 -> v4.3.0.rc1\n", " * [new tag] v4.33.1 -> v4.33.1\n", " * [new tag] v4.4.0 -> v4.4.0\n", " * [new tag] v4.5.0 -> v4.5.0\n", " * [new tag] v4.6.0 -> v4.6.0\n", " * [new tag] v4.7.0 -> v4.7.0\n", " * [new tag] v4.8.0 -> v4.8.0\n", " * [new tag] v4.9.0 -> v4.9.0\n" ] } ], "source": [ "!git fetch origin pull/32406/head:pr-32406" ] }, { 
"cell_type": "code", "source": [ "!git checkout pr-32406" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "_s3Mt90Hqbbd", "outputId": "b8ac5e14-c28c-41f4-ba61-8e936497b125" }, "execution_count": null, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Updating files: 76% (3390/4452)\rUpdating files: 77% (3429/4452)\rUpdating files: 78% (3473/4452)\rUpdating files: 79% (3518/4452)\rUpdating files: 80% (3562/4452)\rUpdating files: 81% (3607/4452)\rUpdating files: 82% (3651/4452)\rUpdating files: 83% (3696/4452)\rUpdating files: 84% (3740/4452)\rUpdating files: 85% (3785/4452)\rUpdating files: 86% (3829/4452)\rUpdating files: 87% (3874/4452)\rUpdating files: 88% (3918/4452)\rUpdating files: 89% (3963/4452)\rUpdating files: 90% (4007/4452)\rUpdating files: 91% (4052/4452)\rUpdating files: 92% (4096/4452)\rUpdating files: 93% (4141/4452)\rUpdating files: 94% (4185/4452)\rUpdating files: 95% (4230/4452)\rUpdating files: 96% (4274/4452)\rUpdating files: 97% (4319/4452)\rUpdating files: 98% (4363/4452)\rUpdating files: 99% (4408/4452)\rUpdating files: 100% (4452/4452)\rUpdating files: 100% (4452/4452), done.\n", "Switched to branch 'pr-32406'\n" ] } ] }, { "cell_type": "code", "source": [ "!pip install -e .[all]" ], "metadata": { "id": "cq0YWuyxrQbf", "colab": { "base_uri": "https://localhost:8080/", "height": 1000 }, "collapsed": true, "outputId": "9c6ea2e5-74f5-4f61-9043-215b7de2572e" }, "execution_count": 9, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Obtaining file:///content\n", " Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n", " Checking if build backend supports build_editable ... \u001b[?25l\u001b[?25hdone\n", " Getting requirements to build editable ... \u001b[?25l\u001b[?25hdone\n", " Preparing editable metadata (pyproject.toml) ... 
\u001b[?25l\u001b[?25hdone\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (3.16.0)\n", "Requirement already satisfied: huggingface-hub<1.0,>=0.23.2 in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (0.24.6)\n", "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (1.26.4)\n", "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (24.1)\n", "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (6.0.2)\n", "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (2024.5.15)\n", "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (2.32.3)\n", "Requirement already satisfied: tokenizers<0.20,>=0.19 in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (0.19.1)\n", "Requirement already satisfied: safetensors>=0.4.1 in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (0.4.5)\n", "Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (4.66.5)\n", "Collecting tensorflow<2.16,>2.9 (from transformers==4.45.0.dev0)\n", " Downloading tensorflow-2.15.1-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (4.2 kB)\n", "Collecting onnxconverter-common (from transformers==4.45.0.dev0)\n", " Downloading onnxconverter_common-1.14.0-py2.py3-none-any.whl.metadata (4.2 kB)\n", "Collecting tf2onnx (from transformers==4.45.0.dev0)\n", " Downloading tf2onnx-1.16.1-py3-none-any.whl.metadata (1.3 kB)\n", "Collecting tensorflow-text<2.16 (from transformers==4.45.0.dev0)\n", " Downloading 
tensorflow_text-2.15.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (1.9 kB)\n", "Collecting keras-nlp<0.14.0,>=0.3.1 (from transformers==4.45.0.dev0)\n", " Downloading keras_nlp-0.12.1-py3-none-any.whl.metadata (6.8 kB)\n", "Requirement already satisfied: torch in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (2.4.0+cu121)\n", "Requirement already satisfied: accelerate>=0.26.0 in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (0.34.2)\n", "Collecting jax<=0.4.13,>=0.4.1 (from transformers==4.45.0.dev0)\n", " Downloading jax-0.4.13.tar.gz (1.3 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[31m17.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n", " Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n", " Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n", "Collecting jaxlib<=0.4.13,>=0.4.1 (from transformers==4.45.0.dev0)\n", " Downloading jaxlib-0.4.13-cp310-cp310-manylinux2014_x86_64.whl.metadata (2.1 kB)\n", "Collecting flax<=0.7.0,>=0.4.1 (from transformers==4.45.0.dev0)\n", " Downloading flax-0.7.0-py3-none-any.whl.metadata (9.9 kB)\n", "Collecting optax<=0.1.4,>=0.0.8 (from transformers==4.45.0.dev0)\n", " Downloading optax-0.1.4-py3-none-any.whl.metadata (12 kB)\n", "Collecting scipy<1.13.0 (from transformers==4.45.0.dev0)\n", " Downloading scipy-1.12.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (60 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m60.4/60.4 kB\u001b[0m \u001b[31m3.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: sentencepiece!=0.1.92,>=0.1.91 in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (0.1.99)\n", "Requirement already satisfied: protobuf in 
/usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (3.20.3)\n", "Requirement already satisfied: torchaudio in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (2.4.0+cu121)\n", "Requirement already satisfied: librosa in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (0.10.2.post1)\n", "Collecting pyctcdecode>=0.4.0 (from transformers==4.45.0.dev0)\n", " Downloading pyctcdecode-0.5.0-py2.py3-none-any.whl.metadata (20 kB)\n", "Collecting phonemizer (from transformers==4.45.0.dev0)\n", " Downloading phonemizer-3.3.0-py3-none-any.whl.metadata (48 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m48.2/48.2 kB\u001b[0m \u001b[31m3.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting kenlm (from transformers==4.45.0.dev0)\n", " Downloading kenlm-0.2.0.tar.gz (427 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m427.4/427.4 kB\u001b[0m \u001b[31m20.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n", " Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n", " Preparing metadata (pyproject.toml) ... 
\u001b[?25l\u001b[?25hdone\n", "Collecting Pillow<=15.0,>=10.0.1 (from transformers==4.45.0.dev0)\n", " Downloading pillow-10.4.0-cp310-cp310-manylinux_2_28_x86_64.whl.metadata (9.2 kB)\n", "Collecting optuna (from transformers==4.45.0.dev0)\n", " Downloading optuna-4.0.0-py3-none-any.whl.metadata (16 kB)\n", "Collecting ray>=2.7.0 (from ray[tune]>=2.7.0; extra == \"all\"->transformers==4.45.0.dev0)\n", " Downloading ray-2.35.0-cp310-cp310-manylinux2014_x86_64.whl.metadata (16 kB)\n", "Collecting sigopt (from transformers==4.45.0.dev0)\n", " Downloading sigopt-8.8.3-py2.py3-none-any.whl.metadata (2.7 kB)\n", "Collecting timm<=0.9.16 (from transformers==4.45.0.dev0)\n", " Downloading timm-0.9.16-py3-none-any.whl.metadata (38 kB)\n", "Requirement already satisfied: torchvision in /usr/local/lib/python3.10/dist-packages (from transformers==4.45.0.dev0) (0.19.0+cu121)\n", "Collecting codecarbon==1.2.0 (from transformers==4.45.0.dev0)\n", " Downloading codecarbon-1.2.0-py3-none-any.whl.metadata (13 kB)\n", "Collecting decord==0.6.0 (from transformers==4.45.0.dev0)\n", " Downloading decord-0.6.0-py3-none-manylinux2010_x86_64.whl.metadata (422 bytes)\n", "Collecting av==9.2.0 (from transformers==4.45.0.dev0)\n", " Downloading av-9.2.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (4.5 kB)\n", "Collecting APScheduler (from codecarbon==1.2.0->transformers==4.45.0.dev0)\n", " Downloading APScheduler-3.10.4-py3-none-any.whl.metadata (5.7 kB)\n", "Collecting dash (from codecarbon==1.2.0->transformers==4.45.0.dev0)\n", " Downloading dash-2.18.1-py3-none-any.whl.metadata (10 kB)\n", "Collecting dash-bootstrap-components (from codecarbon==1.2.0->transformers==4.45.0.dev0)\n", " Downloading dash_bootstrap_components-1.6.0-py3-none-any.whl.metadata (5.2 kB)\n", "Collecting fire (from codecarbon==1.2.0->transformers==4.45.0.dev0)\n", " Downloading fire-0.6.0.tar.gz (88 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m 
\u001b[32m88.4/88.4 kB\u001b[0m \u001b[31m5.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Requirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from codecarbon==1.2.0->transformers==4.45.0.dev0) (2.1.4)\n", "Collecting pynvml (from codecarbon==1.2.0->transformers==4.45.0.dev0)\n", " Downloading pynvml-11.5.3-py3-none-any.whl.metadata (8.8 kB)\n", "Requirement already satisfied: py-cpuinfo in /usr/local/lib/python3.10/dist-packages (from codecarbon==1.2.0->transformers==4.45.0.dev0) (9.0.0)\n", "Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate>=0.26.0->transformers==4.45.0.dev0) (5.9.5)\n", "Requirement already satisfied: msgpack in /usr/local/lib/python3.10/dist-packages (from flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (1.0.8)\n", "Requirement already satisfied: orbax-checkpoint in /usr/local/lib/python3.10/dist-packages (from flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (0.6.3)\n", "Requirement already satisfied: tensorstore in /usr/local/lib/python3.10/dist-packages (from flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (0.1.65)\n", "Requirement already satisfied: rich>=11.1 in /usr/local/lib/python3.10/dist-packages (from flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (13.8.1)\n", "Requirement already satisfied: typing-extensions>=4.1.1 in /usr/local/lib/python3.10/dist-packages (from flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (4.12.2)\n", "Requirement already satisfied: fsspec>=2023.5.0 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.23.2->transformers==4.45.0.dev0) (2024.6.1)\n", "Requirement already satisfied: ml-dtypes>=0.1.0 in /usr/local/lib/python3.10/dist-packages (from jax<=0.4.13,>=0.4.1->transformers==4.45.0.dev0) (0.4.0)\n", "Requirement already satisfied: opt-einsum in /usr/local/lib/python3.10/dist-packages (from 
jax<=0.4.13,>=0.4.1->transformers==4.45.0.dev0) (3.3.0)\n", "Collecting keras-core (from keras-nlp<0.14.0,>=0.3.1->transformers==4.45.0.dev0)\n", " Downloading keras_core-0.1.7-py3-none-any.whl.metadata (4.3 kB)\n", "Requirement already satisfied: absl-py in /usr/local/lib/python3.10/dist-packages (from keras-nlp<0.14.0,>=0.3.1->transformers==4.45.0.dev0) (1.4.0)\n", "Requirement already satisfied: dm-tree in /usr/local/lib/python3.10/dist-packages (from keras-nlp<0.14.0,>=0.3.1->transformers==4.45.0.dev0) (0.1.8)\n", "Requirement already satisfied: kagglehub in /usr/local/lib/python3.10/dist-packages (from keras-nlp<0.14.0,>=0.3.1->transformers==4.45.0.dev0) (0.2.9)\n", "Requirement already satisfied: chex>=0.1.5 in /usr/local/lib/python3.10/dist-packages (from optax<=0.1.4,>=0.0.8->transformers==4.45.0.dev0) (0.1.86)\n", "Collecting pygtrie<3.0,>=2.1 (from pyctcdecode>=0.4.0->transformers==4.45.0.dev0)\n", " Downloading pygtrie-2.5.0-py3-none-any.whl.metadata (7.5 kB)\n", "Collecting hypothesis<7,>=6.14 (from pyctcdecode>=0.4.0->transformers==4.45.0.dev0)\n", " Downloading hypothesis-6.112.1-py3-none-any.whl.metadata (6.2 kB)\n", "Requirement already satisfied: click>=7.0 in /usr/local/lib/python3.10/dist-packages (from ray>=2.7.0->ray[tune]>=2.7.0; extra == \"all\"->transformers==4.45.0.dev0) (8.1.7)\n", "Requirement already satisfied: jsonschema in /usr/local/lib/python3.10/dist-packages (from ray>=2.7.0->ray[tune]>=2.7.0; extra == \"all\"->transformers==4.45.0.dev0) (4.23.0)\n", "Requirement already satisfied: aiosignal in /usr/local/lib/python3.10/dist-packages (from ray>=2.7.0->ray[tune]>=2.7.0; extra == \"all\"->transformers==4.45.0.dev0) (1.3.1)\n", "Requirement already satisfied: frozenlist in /usr/local/lib/python3.10/dist-packages (from ray>=2.7.0->ray[tune]>=2.7.0; extra == \"all\"->transformers==4.45.0.dev0) (1.4.1)\n", "Collecting tensorboardX>=1.9 (from ray[tune]>=2.7.0; extra == \"all\"->transformers==4.45.0.dev0)\n", " Downloading 
tensorboardX-2.6.2.2-py2.py3-none-any.whl.metadata (5.8 kB)\n", "Requirement already satisfied: pyarrow>=6.0.1 in /usr/local/lib/python3.10/dist-packages (from ray[tune]>=2.7.0; extra == \"all\"->transformers==4.45.0.dev0) (14.0.2)\n", "Requirement already satisfied: astunparse>=1.6.0 in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (1.6.3)\n", "Requirement already satisfied: flatbuffers>=23.5.26 in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (24.3.25)\n", "Requirement already satisfied: gast!=0.5.0,!=0.5.1,!=0.5.2,>=0.2.1 in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (0.6.0)\n", "Requirement already satisfied: google-pasta>=0.1.1 in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (0.2.0)\n", "Requirement already satisfied: h5py>=2.9.0 in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (3.11.0)\n", "Requirement already satisfied: libclang>=13.0.0 in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (18.1.1)\n", "Collecting ml-dtypes>=0.1.0 (from jax<=0.4.13,>=0.4.1->transformers==4.45.0.dev0)\n", " Downloading ml_dtypes-0.3.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (20 kB)\n", "Requirement already satisfied: setuptools in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (71.0.4)\n", "Requirement already satisfied: six>=1.12.0 in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (1.16.0)\n", "Requirement already satisfied: termcolor>=1.1.0 in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (2.4.0)\n", "Collecting wrapt<1.15,>=1.11.0 (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0)\n", " Downloading 
wrapt-1.14.1-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (6.7 kB)\n", "Requirement already satisfied: tensorflow-io-gcs-filesystem>=0.23.1 in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (0.37.1)\n", "Requirement already satisfied: grpcio<2.0,>=1.24.3 in /usr/local/lib/python3.10/dist-packages (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (1.64.1)\n", "Collecting tensorboard<2.16,>=2.15 (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0)\n", " Downloading tensorboard-2.15.2-py3-none-any.whl.metadata (1.7 kB)\n", "Collecting tensorflow-estimator<2.16,>=2.15.0 (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0)\n", " Downloading tensorflow_estimator-2.15.0-py2.py3-none-any.whl.metadata (1.3 kB)\n", "Collecting keras<2.16,>=2.15.0 (from tensorflow<2.16,>2.9->transformers==4.45.0.dev0)\n", " Downloading keras-2.15.0-py3-none-any.whl.metadata (2.4 kB)\n", "Requirement already satisfied: tensorflow-hub>=0.13.0 in /usr/local/lib/python3.10/dist-packages (from tensorflow-text<2.16->transformers==4.45.0.dev0) (0.16.1)\n", "Requirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch->transformers==4.45.0.dev0) (1.13.2)\n", "Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch->transformers==4.45.0.dev0) (3.3)\n", "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from torch->transformers==4.45.0.dev0) (3.1.4)\n", "Requirement already satisfied: audioread>=2.1.9 in /usr/local/lib/python3.10/dist-packages (from librosa->transformers==4.45.0.dev0) (3.0.1)\n", "Requirement already satisfied: scikit-learn>=0.20.0 in /usr/local/lib/python3.10/dist-packages (from librosa->transformers==4.45.0.dev0) (1.3.2)\n", "Requirement already satisfied: joblib>=0.14 in /usr/local/lib/python3.10/dist-packages (from librosa->transformers==4.45.0.dev0) (1.4.2)\n", 
"Requirement already satisfied: decorator>=4.3.0 in /usr/local/lib/python3.10/dist-packages (from librosa->transformers==4.45.0.dev0) (4.4.2)\n", "Requirement already satisfied: numba>=0.51.0 in /usr/local/lib/python3.10/dist-packages (from librosa->transformers==4.45.0.dev0) (0.60.0)\n", "Requirement already satisfied: soundfile>=0.12.1 in /usr/local/lib/python3.10/dist-packages (from librosa->transformers==4.45.0.dev0) (0.12.1)\n", "Requirement already satisfied: pooch>=1.1 in /usr/local/lib/python3.10/dist-packages (from librosa->transformers==4.45.0.dev0) (1.8.2)\n", "Requirement already satisfied: soxr>=0.3.2 in /usr/local/lib/python3.10/dist-packages (from librosa->transformers==4.45.0.dev0) (0.5.0.post1)\n", "Requirement already satisfied: lazy-loader>=0.1 in /usr/local/lib/python3.10/dist-packages (from librosa->transformers==4.45.0.dev0) (0.4)\n", "Collecting onnx (from onnxconverter-common->transformers==4.45.0.dev0)\n", " Downloading onnx-1.16.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (16 kB)\n", "INFO: pip is looking at multiple versions of onnxconverter-common to determine which version is compatible with other requirements. 
This could take a while.\n", "Collecting onnxconverter-common (from transformers==4.45.0.dev0)\n", " Downloading onnxconverter_common-1.13.0-py2.py3-none-any.whl.metadata (2.6 kB)\n", "Collecting alembic>=1.5.0 (from optuna->transformers==4.45.0.dev0)\n", " Downloading alembic-1.13.2-py3-none-any.whl.metadata (7.4 kB)\n", "Collecting colorlog (from optuna->transformers==4.45.0.dev0)\n", " Downloading colorlog-6.8.2-py3-none-any.whl.metadata (10 kB)\n", "Requirement already satisfied: sqlalchemy>=1.3.0 in /usr/local/lib/python3.10/dist-packages (from optuna->transformers==4.45.0.dev0) (2.0.34)\n", "Collecting segments (from phonemizer->transformers==4.45.0.dev0)\n", " Downloading segments-2.2.1-py2.py3-none-any.whl.metadata (3.3 kB)\n", "Requirement already satisfied: attrs>=18.1 in /usr/local/lib/python3.10/dist-packages (from phonemizer->transformers==4.45.0.dev0) (24.2.0)\n", "Collecting dlinfo (from phonemizer->transformers==4.45.0.dev0)\n", " Downloading dlinfo-1.2.1-py3-none-any.whl.metadata (1.1 kB)\n", "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.45.0.dev0) (3.3.2)\n", "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.45.0.dev0) (3.8)\n", "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.45.0.dev0) (2.0.7)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.45.0.dev0) (2024.8.30)\n", "Collecting backoff<2.0.0,>=1.10.0 (from sigopt->transformers==4.45.0.dev0)\n", " Downloading backoff-1.11.1-py2.py3-none-any.whl.metadata (12 kB)\n", "Collecting GitPython>=2.0.0 (from sigopt->transformers==4.45.0.dev0)\n", " Downloading GitPython-3.1.43-py3-none-any.whl.metadata (13 kB)\n", "Collecting pypng>=0.0.20 (from sigopt->transformers==4.45.0.dev0)\n", " 
Downloading pypng-0.20220715.0-py3-none-any.whl.metadata (13 kB)\n", "Collecting urllib3<3,>=1.21.1 (from requests->transformers==4.45.0.dev0)\n", " Downloading urllib3-1.26.20-py2.py3-none-any.whl.metadata (50 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m50.1/50.1 kB\u001b[0m \u001b[31m3.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting Mako (from alembic>=1.5.0->optuna->transformers==4.45.0.dev0)\n", " Downloading Mako-1.3.5-py3-none-any.whl.metadata (2.9 kB)\n", "Requirement already satisfied: wheel<1.0,>=0.23.0 in /usr/local/lib/python3.10/dist-packages (from astunparse>=1.6.0->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (0.44.0)\n", "INFO: pip is looking at multiple versions of chex to determine which version is compatible with other requirements. This could take a while.\n", "Collecting chex>=0.1.5 (from optax<=0.1.4,>=0.0.8->transformers==4.45.0.dev0)\n", " Downloading chex-0.1.85-py3-none-any.whl.metadata (17 kB)\n", " Downloading chex-0.1.84-py3-none-any.whl.metadata (17 kB)\n", " Downloading chex-0.1.83-py3-none-any.whl.metadata (17 kB)\n", " Downloading chex-0.1.82-py3-none-any.whl.metadata (17 kB)\n", "Requirement already satisfied: toolz>=0.9.0 in /usr/local/lib/python3.10/dist-packages (from chex>=0.1.5->optax<=0.1.4,>=0.0.8->transformers==4.45.0.dev0) (0.12.1)\n", "Collecting gitdb<5,>=4.0.1 (from GitPython>=2.0.0->sigopt->transformers==4.45.0.dev0)\n", " Downloading gitdb-4.0.11-py3-none-any.whl.metadata (1.2 kB)\n", "Requirement already satisfied: sortedcontainers<3.0.0,>=2.1.0 in /usr/local/lib/python3.10/dist-packages (from hypothesis<7,>=6.14->pyctcdecode>=0.4.0->transformers==4.45.0.dev0) (2.4.0)\n", "Requirement already satisfied: exceptiongroup>=1.0.0 in /usr/local/lib/python3.10/dist-packages (from hypothesis<7,>=6.14->pyctcdecode>=0.4.0->transformers==4.45.0.dev0) (1.2.2)\n", "Requirement already satisfied: llvmlite<0.44,>=0.43.0dev0 in 
/usr/local/lib/python3.10/dist-packages (from numba>=0.51.0->librosa->transformers==4.45.0.dev0) (0.43.0)\n", "Requirement already satisfied: platformdirs>=2.5.0 in /usr/local/lib/python3.10/dist-packages (from pooch>=1.1->librosa->transformers==4.45.0.dev0) (4.3.2)\n", "Requirement already satisfied: markdown-it-py>=2.2.0 in /usr/local/lib/python3.10/dist-packages (from rich>=11.1->flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (3.0.0)\n", "Requirement already satisfied: pygments<3.0.0,>=2.13.0 in /usr/local/lib/python3.10/dist-packages (from rich>=11.1->flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (2.16.1)\n", "Requirement already satisfied: threadpoolctl>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from scikit-learn>=0.20.0->librosa->transformers==4.45.0.dev0) (3.5.0)\n", "Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.10/dist-packages (from soundfile>=0.12.1->librosa->transformers==4.45.0.dev0) (1.17.1)\n", "Requirement already satisfied: greenlet!=0.4.17 in /usr/local/lib/python3.10/dist-packages (from sqlalchemy>=1.3.0->optuna->transformers==4.45.0.dev0) (3.1.0)\n", "Requirement already satisfied: google-auth<3,>=1.6.3 in /usr/local/lib/python3.10/dist-packages (from tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (2.27.0)\n", "Requirement already satisfied: google-auth-oauthlib<2,>=0.5 in /usr/local/lib/python3.10/dist-packages (from tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (1.2.1)\n", "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.10/dist-packages (from tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (3.7)\n", "Requirement already satisfied: tensorboard-data-server<0.8.0,>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (0.7.2)\n", "Requirement already satisfied: werkzeug>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from 
tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (3.0.4)\n", "Requirement already satisfied: tf-keras>=2.14.1 in /usr/local/lib/python3.10/dist-packages (from tensorflow-hub>=0.13.0->tensorflow-text<2.16->transformers==4.45.0.dev0) (2.17.0)\n", "Requirement already satisfied: pytz in /usr/local/lib/python3.10/dist-packages (from APScheduler->codecarbon==1.2.0->transformers==4.45.0.dev0) (2024.2)\n", "Requirement already satisfied: tzlocal!=3.*,>=2.0 in /usr/local/lib/python3.10/dist-packages (from APScheduler->codecarbon==1.2.0->transformers==4.45.0.dev0) (5.2)\n", "Requirement already satisfied: Flask<3.1,>=1.0.4 in /usr/local/lib/python3.10/dist-packages (from dash->codecarbon==1.2.0->transformers==4.45.0.dev0) (2.2.5)\n", "Requirement already satisfied: plotly>=5.0.0 in /usr/local/lib/python3.10/dist-packages (from dash->codecarbon==1.2.0->transformers==4.45.0.dev0) (5.15.0)\n", "Collecting dash-html-components==2.0.0 (from dash->codecarbon==1.2.0->transformers==4.45.0.dev0)\n", " Downloading dash_html_components-2.0.0-py3-none-any.whl.metadata (3.8 kB)\n", "Collecting dash-core-components==2.0.0 (from dash->codecarbon==1.2.0->transformers==4.45.0.dev0)\n", " Downloading dash_core_components-2.0.0-py3-none-any.whl.metadata (2.9 kB)\n", "Collecting dash-table==5.0.0 (from dash->codecarbon==1.2.0->transformers==4.45.0.dev0)\n", " Downloading dash_table-5.0.0-py3-none-any.whl.metadata (2.4 kB)\n", "Requirement already satisfied: importlib-metadata in /usr/local/lib/python3.10/dist-packages (from dash->codecarbon==1.2.0->transformers==4.45.0.dev0) (8.5.0)\n", "Collecting retrying (from dash->codecarbon==1.2.0->transformers==4.45.0.dev0)\n", " Downloading retrying-1.3.4-py3-none-any.whl.metadata (6.9 kB)\n", "Requirement already satisfied: nest-asyncio in /usr/local/lib/python3.10/dist-packages (from dash->codecarbon==1.2.0->transformers==4.45.0.dev0) (1.6.0)\n", "Requirement already satisfied: MarkupSafe>=2.0 in 
/usr/local/lib/python3.10/dist-packages (from jinja2->torch->transformers==4.45.0.dev0) (2.1.5)\n", "Requirement already satisfied: jsonschema-specifications>=2023.03.6 in /usr/local/lib/python3.10/dist-packages (from jsonschema->ray>=2.7.0->ray[tune]>=2.7.0; extra == \"all\"->transformers==4.45.0.dev0) (2023.12.1)\n", "Requirement already satisfied: referencing>=0.28.4 in /usr/local/lib/python3.10/dist-packages (from jsonschema->ray>=2.7.0->ray[tune]>=2.7.0; extra == \"all\"->transformers==4.45.0.dev0) (0.35.1)\n", "Requirement already satisfied: rpds-py>=0.7.1 in /usr/local/lib/python3.10/dist-packages (from jsonschema->ray>=2.7.0->ray[tune]>=2.7.0; extra == \"all\"->transformers==4.45.0.dev0) (0.20.0)\n", "Requirement already satisfied: namex in /usr/local/lib/python3.10/dist-packages (from keras-core->keras-nlp<0.14.0,>=0.3.1->transformers==4.45.0.dev0) (0.0.8)\n", "Requirement already satisfied: etils[epath,epy] in /usr/local/lib/python3.10/dist-packages (from orbax-checkpoint->flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (1.9.4)\n", "INFO: pip is looking at multiple versions of orbax-checkpoint to determine which version is compatible with other requirements. This could take a while.\n", "Collecting orbax-checkpoint (from flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0)\n", " Downloading orbax_checkpoint-0.6.2-py3-none-any.whl.metadata (1.8 kB)\n", " Downloading orbax_checkpoint-0.6.1-py3-none-any.whl.metadata (1.8 kB)\n", " Downloading orbax_checkpoint-0.6.0-py3-none-any.whl.metadata (1.8 kB)\n", " Downloading orbax_checkpoint-0.5.23-py3-none-any.whl.metadata (1.8 kB)\n", " Downloading orbax_checkpoint-0.5.22-py3-none-any.whl.metadata (1.8 kB)\n", " Downloading orbax_checkpoint-0.5.21-py3-none-any.whl.metadata (1.8 kB)\n", " Downloading orbax_checkpoint-0.5.20-py3-none-any.whl.metadata (1.8 kB)\n", "INFO: pip is still looking at multiple versions of orbax-checkpoint to determine which version is compatible with other requirements. 
This could take a while.\n", " Downloading orbax_checkpoint-0.5.19-py3-none-any.whl.metadata (1.8 kB)\n", " Downloading orbax_checkpoint-0.5.18-py3-none-any.whl.metadata (1.8 kB)\n", " Downloading orbax_checkpoint-0.5.17-py3-none-any.whl.metadata (1.8 kB)\n", " Downloading orbax_checkpoint-0.5.16-py3-none-any.whl.metadata (1.8 kB)\n", "Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.10/dist-packages (from pandas->codecarbon==1.2.0->transformers==4.45.0.dev0) (2.8.2)\n", "Requirement already satisfied: tzdata>=2022.1 in /usr/local/lib/python3.10/dist-packages (from pandas->codecarbon==1.2.0->transformers==4.45.0.dev0) (2024.1)\n", "Collecting clldutils>=1.7.3 (from segments->phonemizer->transformers==4.45.0.dev0)\n", " Downloading clldutils-3.22.2-py2.py3-none-any.whl.metadata (3.0 kB)\n", "Collecting csvw>=1.5.6 (from segments->phonemizer->transformers==4.45.0.dev0)\n", " Downloading csvw-3.3.1-py2.py3-none-any.whl.metadata (10 kB)\n", "Requirement already satisfied: mpmath<1.4,>=1.1.0 in /usr/local/lib/python3.10/dist-packages (from sympy->torch->transformers==4.45.0.dev0) (1.3.0)\n", "Requirement already satisfied: pycparser in /usr/local/lib/python3.10/dist-packages (from cffi>=1.0->soundfile>=0.12.1->librosa->transformers==4.45.0.dev0) (2.22)\n", "Requirement already satisfied: tabulate>=0.7.7 in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer->transformers==4.45.0.dev0) (0.9.0)\n", "Collecting bibtexparser>=2.0.0b4 (from clldutils>=1.7.3->segments->phonemizer->transformers==4.45.0.dev0)\n", " Downloading bibtexparser-2.0.0b7-py3-none-any.whl.metadata (5.6 kB)\n", "Collecting pylatexenc (from clldutils>=1.7.3->segments->phonemizer->transformers==4.45.0.dev0)\n", " Downloading pylatexenc-2.10.tar.gz (162 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m162.6/162.6 kB\u001b[0m \u001b[31m9.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h 
Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Requirement already satisfied: lxml in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer->transformers==4.45.0.dev0) (4.9.4)\n", "Requirement already satisfied: babel in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer->transformers==4.45.0.dev0) (2.16.0)\n", "Collecting colorama (from csvw>=1.5.6->segments->phonemizer->transformers==4.45.0.dev0)\n", " Downloading colorama-0.4.6-py2.py3-none-any.whl.metadata (17 kB)\n", "Collecting isodate (from csvw>=1.5.6->segments->phonemizer->transformers==4.45.0.dev0)\n", " Downloading isodate-0.6.1-py2.py3-none-any.whl.metadata (9.6 kB)\n", "Collecting language-tags (from csvw>=1.5.6->segments->phonemizer->transformers==4.45.0.dev0)\n", " Downloading language_tags-1.2.0-py3-none-any.whl.metadata (2.1 kB)\n", "Collecting rdflib (from csvw>=1.5.6->segments->phonemizer->transformers==4.45.0.dev0)\n", " Downloading rdflib-7.0.0-py3-none-any.whl.metadata (11 kB)\n", "Collecting rfc3986<2 (from csvw>=1.5.6->segments->phonemizer->transformers==4.45.0.dev0)\n", " Downloading rfc3986-1.5.0-py2.py3-none-any.whl.metadata (6.5 kB)\n", "Requirement already satisfied: uritemplate>=3.0.0 in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer->transformers==4.45.0.dev0) (4.1.1)\n", "Requirement already satisfied: itsdangerous>=2.0 in /usr/local/lib/python3.10/dist-packages (from Flask<3.1,>=1.0.4->dash->codecarbon==1.2.0->transformers==4.45.0.dev0) (2.2.0)\n", "Collecting smmap<6,>=3.0.1 (from gitdb<5,>=4.0.1->GitPython>=2.0.0->sigopt->transformers==4.45.0.dev0)\n", " Downloading smmap-5.0.1-py3-none-any.whl.metadata (4.3 kB)\n", "Requirement already satisfied: cachetools<6.0,>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (5.5.0)\n", "Requirement already satisfied: 
pyasn1-modules>=0.2.1 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (0.4.1)\n", "Requirement already satisfied: rsa<5,>=3.1.4 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (4.9)\n", "Requirement already satisfied: requests-oauthlib>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from google-auth-oauthlib<2,>=0.5->tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (1.3.1)\n", "Requirement already satisfied: mdurl~=0.1 in /usr/local/lib/python3.10/dist-packages (from markdown-it-py>=2.2.0->rich>=11.1->flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (0.1.2)\n", "Requirement already satisfied: tenacity>=6.2.0 in /usr/local/lib/python3.10/dist-packages (from plotly>=5.0.0->dash->codecarbon==1.2.0->transformers==4.45.0.dev0) (9.0.0)\n", "INFO: pip is looking at multiple versions of tf-keras to determine which version is compatible with other requirements. 
This could take a while.\n", "Collecting tf-keras>=2.14.1 (from tensorflow-hub>=0.13.0->tensorflow-text<2.16->transformers==4.45.0.dev0)\n", " Downloading tf_keras-2.16.0-py3-none-any.whl.metadata (1.6 kB)\n", " Downloading tf_keras-2.15.1-py3-none-any.whl.metadata (1.7 kB)\n", "Requirement already satisfied: importlib_resources in /usr/local/lib/python3.10/dist-packages (from etils[epath,epy]->orbax-checkpoint->flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (6.4.5)\n", "Requirement already satisfied: zipp in /usr/local/lib/python3.10/dist-packages (from etils[epath,epy]->orbax-checkpoint->flax<=0.7.0,>=0.4.1->transformers==4.45.0.dev0) (3.20.1)\n", "Requirement already satisfied: pyasn1<0.7.0,>=0.4.6 in /usr/local/lib/python3.10/dist-packages (from pyasn1-modules>=0.2.1->google-auth<3,>=1.6.3->tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (0.6.1)\n", "Requirement already satisfied: oauthlib>=3.0.0 in /usr/local/lib/python3.10/dist-packages (from requests-oauthlib>=0.7.0->google-auth-oauthlib<2,>=0.5->tensorboard<2.16,>=2.15->tensorflow<2.16,>2.9->transformers==4.45.0.dev0) (3.2.2)\n", "Requirement already satisfied: pyparsing<4,>=2.1.0 in /usr/local/lib/python3.10/dist-packages (from rdflib->csvw>=1.5.6->segments->phonemizer->transformers==4.45.0.dev0) (3.1.4)\n", "Downloading av-9.2.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (28.8 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m28.8/28.8 MB\u001b[0m \u001b[31m17.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading codecarbon-1.2.0-py3-none-any.whl (135 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m135.0/135.0 kB\u001b[0m \u001b[31m8.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading decord-0.6.0-py3-none-manylinux2010_x86_64.whl (13.6 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m13.6/13.6 
MB\u001b[0m \u001b[31m75.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading flax-0.7.0-py3-none-any.whl (225 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m225.9/225.9 kB\u001b[0m \u001b[31m14.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading jaxlib-0.4.13-cp310-cp310-manylinux2014_x86_64.whl (71.6 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m71.6/71.6 MB\u001b[0m \u001b[31m7.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading keras_nlp-0.12.1-py3-none-any.whl (570 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m570.5/570.5 kB\u001b[0m \u001b[31m31.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading optax-0.1.4-py3-none-any.whl (154 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m154.9/154.9 kB\u001b[0m \u001b[31m10.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading pillow-10.4.0-cp310-cp310-manylinux_2_28_x86_64.whl (4.5 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m4.5/4.5 MB\u001b[0m \u001b[31m83.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading pyctcdecode-0.5.0-py2.py3-none-any.whl (39 kB)\n", "Downloading ray-2.35.0-cp310-cp310-manylinux2014_x86_64.whl (65.0 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m65.0/65.0 MB\u001b[0m \u001b[31m10.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading scipy-1.12.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (38.4 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m38.4/38.4 MB\u001b[0m \u001b[31m18.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading tensorflow-2.15.1-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (475.2 
MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m475.2/475.2 MB\u001b[0m \u001b[31m1.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading tensorflow_text-2.15.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (5.2 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m5.2/5.2 MB\u001b[0m \u001b[31m57.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading timm-0.9.16-py3-none-any.whl (2.2 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m2.2/2.2 MB\u001b[0m \u001b[31m49.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading onnxconverter_common-1.13.0-py2.py3-none-any.whl (83 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m83.8/83.8 kB\u001b[0m \u001b[31m6.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading optuna-4.0.0-py3-none-any.whl (362 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m362.8/362.8 kB\u001b[0m \u001b[31m22.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading phonemizer-3.3.0-py3-none-any.whl (103 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m103.8/103.8 kB\u001b[0m \u001b[31m8.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading sigopt-8.8.3-py2.py3-none-any.whl (198 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m198.8/198.8 kB\u001b[0m \u001b[31m7.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading tf2onnx-1.16.1-py3-none-any.whl (455 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m455.8/455.8 kB\u001b[0m \u001b[31m27.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading alembic-1.13.2-py3-none-any.whl (232 kB)\n", "\u001b[2K 
\u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m233.0/233.0 kB\u001b[0m \u001b[31m15.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading backoff-1.11.1-py2.py3-none-any.whl (13 kB)\n", "Downloading chex-0.1.82-py3-none-any.whl (94 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m94.8/94.8 kB\u001b[0m \u001b[31m6.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading GitPython-3.1.43-py3-none-any.whl (207 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m207.3/207.3 kB\u001b[0m \u001b[31m14.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading hypothesis-6.112.1-py3-none-any.whl (467 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m467.5/467.5 kB\u001b[0m \u001b[31m26.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading keras-2.15.0-py3-none-any.whl (1.7 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.7/1.7 MB\u001b[0m \u001b[31m46.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading ml_dtypes-0.3.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (2.2 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m2.2/2.2 MB\u001b[0m \u001b[31m47.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading onnx-1.16.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (15.9 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m15.9/15.9 MB\u001b[0m \u001b[31m84.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading pygtrie-2.5.0-py3-none-any.whl (25 kB)\n", "Downloading pypng-0.20220715.0-py3-none-any.whl (58 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m58.1/58.1 kB\u001b[0m \u001b[31m4.2 MB/s\u001b[0m eta 
\u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading tensorboard-2.15.2-py3-none-any.whl (5.5 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m5.5/5.5 MB\u001b[0m \u001b[31m95.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading tensorboardX-2.6.2.2-py2.py3-none-any.whl (101 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m101.7/101.7 kB\u001b[0m \u001b[31m7.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading tensorflow_estimator-2.15.0-py2.py3-none-any.whl (441 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m442.0/442.0 kB\u001b[0m \u001b[31m22.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading urllib3-1.26.20-py2.py3-none-any.whl (144 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m144.2/144.2 kB\u001b[0m \u001b[31m10.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading wrapt-1.14.1-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (77 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m77.9/77.9 kB\u001b[0m \u001b[31m5.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading APScheduler-3.10.4-py3-none-any.whl (59 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m59.3/59.3 kB\u001b[0m \u001b[31m4.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading colorlog-6.8.2-py3-none-any.whl (11 kB)\n", "Downloading dash-2.18.1-py3-none-any.whl (7.5 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.5/7.5 MB\u001b[0m \u001b[31m64.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading dash_core_components-2.0.0-py3-none-any.whl (3.8 kB)\n", "Downloading dash_html_components-2.0.0-py3-none-any.whl (4.1 
kB)\n", "Downloading dash_table-5.0.0-py3-none-any.whl (3.9 kB)\n", "Downloading dash_bootstrap_components-1.6.0-py3-none-any.whl (222 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m222.5/222.5 kB\u001b[0m \u001b[31m15.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading dlinfo-1.2.1-py3-none-any.whl (3.6 kB)\n", "Downloading keras_core-0.1.7-py3-none-any.whl (950 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m950.8/950.8 kB\u001b[0m \u001b[31m36.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading orbax_checkpoint-0.5.16-py3-none-any.whl (217 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m217.0/217.0 kB\u001b[0m \u001b[31m15.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading pynvml-11.5.3-py3-none-any.whl (53 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m53.1/53.1 kB\u001b[0m \u001b[31m3.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading segments-2.2.1-py2.py3-none-any.whl (15 kB)\n", "Downloading clldutils-3.22.2-py2.py3-none-any.whl (1.7 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.7/1.7 MB\u001b[0m \u001b[31m45.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading csvw-3.3.1-py2.py3-none-any.whl (57 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m57.9/57.9 kB\u001b[0m \u001b[31m4.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading gitdb-4.0.11-py3-none-any.whl (62 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m62.7/62.7 kB\u001b[0m \u001b[31m4.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading tf_keras-2.15.1-py3-none-any.whl (1.7 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m 
\u001b[32m1.7/1.7 MB\u001b[0m \u001b[31m32.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading Mako-1.3.5-py3-none-any.whl (78 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m78.6/78.6 kB\u001b[0m \u001b[31m5.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading retrying-1.3.4-py3-none-any.whl (11 kB)\n", "Downloading bibtexparser-2.0.0b7-py3-none-any.whl (38 kB)\n", "Downloading rfc3986-1.5.0-py2.py3-none-any.whl (31 kB)\n", "Downloading smmap-5.0.1-py3-none-any.whl (24 kB)\n", "Downloading colorama-0.4.6-py2.py3-none-any.whl (25 kB)\n", "Downloading isodate-0.6.1-py2.py3-none-any.whl (41 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m41.7/41.7 kB\u001b[0m \u001b[31m2.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading language_tags-1.2.0-py3-none-any.whl (213 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m213.4/213.4 kB\u001b[0m \u001b[31m13.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hDownloading rdflib-7.0.0-py3-none-any.whl (531 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m531.9/531.9 kB\u001b[0m \u001b[31m26.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hBuilding wheels for collected packages: transformers, jax, kenlm, fire, pylatexenc\n", " Building editable for transformers (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for transformers: filename=transformers-4.45.0.dev0-0.editable-py3-none-any.whl size=17235 sha256=47f8d7fd33fbf68a16dcdf9eb478de0330868e96b41dddcaa2e90ce820af3d0c\n", " Stored in directory: /tmp/pip-ephem-wheel-cache-4a6k3c9o/wheels/e8/d3/96/0e8c7135806cbda4db28d12fc8d710e5e4f66ced1411163e67\n", " Building wheel for jax (pyproject.toml) ... 
\u001b[?25l\u001b[?25hdone\n", " Created wheel for jax: filename=jax-0.4.13-py3-none-any.whl size=1518703 sha256=696a457ee4a211a88e694e2ebf08a4f507a8a30771990bfddfe138813b2c9365\n", " Stored in directory: /root/.cache/pip/wheels/f3/7a/25/f297f69029b5e4064e4736a0c4b3996a44cc27781c120bcb99\n", " Building wheel for kenlm (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for kenlm: filename=kenlm-0.2.0-cp310-cp310-linux_x86_64.whl size=3184429 sha256=13f3f18abd6e36cd73d41e00a8f62353ba919d0dc6283b26d233ce3d7a001263\n", " Stored in directory: /root/.cache/pip/wheels/fd/80/e0/18f4148e863fb137bd87e21ee2bf423b81b3ed6989dab95135\n", " Building wheel for fire (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for fire: filename=fire-0.6.0-py2.py3-none-any.whl size=117030 sha256=663b80270e4bec0b4b2a2170c8587b95783f5bb0683d5e2d919836b362b8e838\n", " Stored in directory: /root/.cache/pip/wheels/d6/6d/5d/5b73fa0f46d01a793713f8859201361e9e581ced8c75e5c6a3\n", " Building wheel for pylatexenc (setup.py) ... 
\u001b[?25l\u001b[?25hdone\n", " Created wheel for pylatexenc: filename=pylatexenc-2.10-py3-none-any.whl size=136817 sha256=ac148679a22a494d8e13b2f1d3c8edf4753a07b4a509bdc91ede1fac56069ade\n", " Stored in directory: /root/.cache/pip/wheels/d3/31/8b/e09b0386afd80cfc556c00408c9aeea5c35c4d484a9c762fd5\n", "Successfully built transformers jax kenlm fire pylatexenc\n", "Installing collected packages: rfc3986, pypng, pylatexenc, pygtrie, language-tags, kenlm, dlinfo, dash-table, dash-html-components, dash-core-components, av, wrapt, urllib3, tensorflow-estimator, tensorboardX, smmap, scipy, retrying, pynvml, Pillow, onnx, ml-dtypes, Mako, keras, isodate, hypothesis, fire, decord, colorlog, colorama, bibtexparser, backoff, APScheduler, rdflib, pyctcdecode, onnxconverter-common, jaxlib, jax, gitdb, clldutils, alembic, tf2onnx, orbax-checkpoint, optuna, keras-core, GitPython, dash, chex, timm, sigopt, ray, optax, dash-bootstrap-components, csvw, transformers, tensorboard, segments, flax, codecarbon, tensorflow, phonemizer, tf-keras, tensorflow-text, keras-nlp\n", " Attempting uninstall: wrapt\n", " Found existing installation: wrapt 1.16.0\n", " Uninstalling wrapt-1.16.0:\n", " Successfully uninstalled wrapt-1.16.0\n", " Attempting uninstall: urllib3\n", " Found existing installation: urllib3 2.0.7\n", " Uninstalling urllib3-2.0.7:\n", " Successfully uninstalled urllib3-2.0.7\n", " Attempting uninstall: scipy\n", " Found existing installation: scipy 1.13.1\n", " Uninstalling scipy-1.13.1:\n", " Successfully uninstalled scipy-1.13.1\n", " Attempting uninstall: Pillow\n", " Found existing installation: Pillow 9.4.0\n", " Uninstalling Pillow-9.4.0:\n", " Successfully uninstalled Pillow-9.4.0\n", " Attempting uninstall: ml-dtypes\n", " Found existing installation: ml-dtypes 0.4.0\n", " Uninstalling ml-dtypes-0.4.0:\n", " Successfully uninstalled ml-dtypes-0.4.0\n", " Attempting uninstall: keras\n", " Found existing installation: keras 3.4.1\n", " Uninstalling keras-3.4.1:\n", " 
Successfully uninstalled keras-3.4.1\n", " Attempting uninstall: jaxlib\n", " Found existing installation: jaxlib 0.4.26+cuda12.cudnn89\n", " Uninstalling jaxlib-0.4.26+cuda12.cudnn89:\n", " Successfully uninstalled jaxlib-0.4.26+cuda12.cudnn89\n", " Attempting uninstall: jax\n", " Found existing installation: jax 0.4.26\n", " Uninstalling jax-0.4.26:\n", " Successfully uninstalled jax-0.4.26\n", " Attempting uninstall: orbax-checkpoint\n", " Found existing installation: orbax-checkpoint 0.6.3\n", " Uninstalling orbax-checkpoint-0.6.3:\n", " Successfully uninstalled orbax-checkpoint-0.6.3\n", " Attempting uninstall: chex\n", " Found existing installation: chex 0.1.86\n", " Uninstalling chex-0.1.86:\n", " Successfully uninstalled chex-0.1.86\n", " Attempting uninstall: optax\n", " Found existing installation: optax 0.2.2\n", " Uninstalling optax-0.2.2:\n", " Successfully uninstalled optax-0.2.2\n", " Attempting uninstall: transformers\n", " Found existing installation: transformers 4.44.2\n", " Uninstalling transformers-4.44.2:\n", " Successfully uninstalled transformers-4.44.2\n", " Attempting uninstall: tensorboard\n", " Found existing installation: tensorboard 2.17.0\n", " Uninstalling tensorboard-2.17.0:\n", " Successfully uninstalled tensorboard-2.17.0\n", " Attempting uninstall: flax\n", " Found existing installation: flax 0.8.4\n", " Uninstalling flax-0.8.4:\n", " Successfully uninstalled flax-0.8.4\n", " Attempting uninstall: tensorflow\n", " Found existing installation: tensorflow 2.17.0\n", " Uninstalling tensorflow-2.17.0:\n", " Successfully uninstalled tensorflow-2.17.0\n", " Attempting uninstall: tf-keras\n", " Found existing installation: tf_keras 2.17.0\n", " Uninstalling tf_keras-2.17.0:\n", " Successfully uninstalled tf_keras-2.17.0\n", "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. 
This behaviour is the source of the following dependency conflicts.\n", "osqp 0.6.7.post0 requires scipy!=1.12.0,>=0.13.2, but you have scipy 1.12.0 which is incompatible.\u001b[0m\u001b[31m\n", "\u001b[0mSuccessfully installed APScheduler-3.10.4 GitPython-3.1.43 Mako-1.3.5 Pillow-10.4.0 alembic-1.13.2 av-9.2.0 backoff-1.11.1 bibtexparser-2.0.0b7 chex-0.1.82 clldutils-3.22.2 codecarbon-1.2.0 colorama-0.4.6 colorlog-6.8.2 csvw-3.3.1 dash-2.18.1 dash-bootstrap-components-1.6.0 dash-core-components-2.0.0 dash-html-components-2.0.0 dash-table-5.0.0 decord-0.6.0 dlinfo-1.2.1 fire-0.6.0 flax-0.7.0 gitdb-4.0.11 hypothesis-6.112.1 isodate-0.6.1 jax-0.4.13 jaxlib-0.4.13 kenlm-0.2.0 keras-2.15.0 keras-core-0.1.7 keras-nlp-0.12.1 language-tags-1.2.0 ml-dtypes-0.3.2 onnx-1.16.2 onnxconverter-common-1.13.0 optax-0.1.4 optuna-4.0.0 orbax-checkpoint-0.5.16 phonemizer-3.3.0 pyctcdecode-0.5.0 pygtrie-2.5.0 pylatexenc-2.10 pynvml-11.5.3 pypng-0.20220715.0 ray-2.35.0 rdflib-7.0.0 retrying-1.3.4 rfc3986-1.5.0 scipy-1.12.0 segments-2.2.1 sigopt-8.8.3 smmap-5.0.1 tensorboard-2.15.2 tensorboardX-2.6.2.2 tensorflow-2.15.1 tensorflow-estimator-2.15.0 tensorflow-text-2.15.0 tf-keras-2.15.1 tf2onnx-1.16.1 timm-0.9.16 transformers-4.45.0.dev0 urllib3-1.26.20 wrapt-1.14.1\n" ] }, { "output_type": "display_data", "data": { "application/vnd.colab-display-data+json": { "pip_warning": { "packages": [ "PIL" ] }, "id": "13f986199d30470480155a0a26153ae8" } }, "metadata": {} } ] }, { "cell_type": "code", "source": [ "from transformers import OlmoeForCausalLM, AutoTokenizer" ], "metadata": { "id": "ijEEXUXztzXD" }, "execution_count": 6, "outputs": [] }, { "cell_type": "code", "source": [ "import torch" ], "metadata": { "id": "3sUL_mpAvywU" }, "execution_count": 5, "outputs": [] }, { "cell_type": "code", "source": [ "DEVICE = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n", "\n", "# Load different ckpts via passing e.g. 
`revision=step10000-tokens41B`\n", "model = OlmoeForCausalLM.from_pretrained(\"allenai/OLMoE-1B-7B-0924\").to(DEVICE)\n", "tokenizer = AutoTokenizer.from_pretrained(\"allenai/OLMoE-1B-7B-0924\")\n", "inputs = tokenizer(\"Bitcoin is\", return_tensors=\"pt\")\n", "inputs = {k: v.to(DEVICE) for k, v in inputs.items()}\n", "out = model.generate(**inputs, max_length=64)\n", "print(tokenizer.decode(out[0]))" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 49, "referenced_widgets": [ "9074c90ec0f74bf29bf36d65ebba1b96", "39038e915d234800bcaaa9b3895f1b68", "6d3b0f9e6c494cbea42456b60b011564", "831274f9a0ec40668ec7fcc5ac2771c3", "8fa5eaaf1c8d4bc18ee076d33d563a0a", "4a614b527a2a49789d41df08c3466764", "30e7f062bc1b44a3a99363cb1a06fea9", "528eadb5cd604eb78b99b3781ad8a357", "4f5a0839fd414dbaa5a2f6306cfa5ecc", "d44816c885194cef98b86893263b9b10", "9c8da3b512bf414684a22b77d7fe48c6" ] }, "id": "Kj8Ti_I_wcvc", "outputId": "4419620d-f678-4f1c-9e27-593298f9c0ed" }, "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "Loading checkpoint shards: 0%| | 0/3 [00:00