{ "cells": [ { "cell_type": "code", "source": [ "%pip install huggingface_hub httpx tqdm --upgrade" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "pCPC0RUTOt7i", "outputId": "2dff92e3-a9ae-4ef8-e47b-24f754556a01" }, "execution_count": 1, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Collecting huggingface_hub\n", " Downloading huggingface_hub-0.17.2-py3-none-any.whl (294 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m294.9/294.9 kB\u001b[0m \u001b[31m4.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting httpx\n", " Downloading httpx-0.25.0-py3-none-any.whl (75 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m75.7/75.7 kB\u001b[0m \u001b[31m7.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: tqdm in /usr/local/lib/python3.10/dist-packages (4.66.1)\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface_hub) (3.12.2)\n", "Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from huggingface_hub) (2023.6.0)\n", "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from huggingface_hub) (2.31.0)\n", "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from huggingface_hub) (6.0.1)\n", "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface_hub) (4.5.0)\n", "Requirement already satisfied: packaging>=20.9 in /usr/local/lib/python3.10/dist-packages (from huggingface_hub) (23.1)\n", "Requirement already satisfied: certifi in /usr/local/lib/python3.10/dist-packages (from httpx) (2023.7.22)\n", "Collecting httpcore<0.19.0,>=0.18.0 (from httpx)\n", " Downloading httpcore-0.18.0-py3-none-any.whl (76 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m76.0/76.0 kB\u001b[0m \u001b[31m5.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: idna in /usr/local/lib/python3.10/dist-packages (from httpx) (3.4)\n", "Requirement already satisfied: sniffio in /usr/local/lib/python3.10/dist-packages (from httpx) (1.3.0)\n", "Requirement already satisfied: anyio<5.0,>=3.0 in /usr/local/lib/python3.10/dist-packages (from httpcore<0.19.0,>=0.18.0->httpx) (3.7.1)\n", "Collecting h11<0.15,>=0.13 (from httpcore<0.19.0,>=0.18.0->httpx)\n", " Downloading h11-0.14.0-py3-none-any.whl (58 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m58.3/58.3 kB\u001b[0m \u001b[31m6.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface_hub) (3.2.0)\n", "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface_hub) (2.0.4)\n", "Requirement already satisfied: exceptiongroup in /usr/local/lib/python3.10/dist-packages (from anyio<5.0,>=3.0->httpcore<0.19.0,>=0.18.0->httpx) (1.1.3)\n", "Installing collected packages: h11, huggingface_hub, httpcore, httpx\n", "Successfully installed h11-0.14.0 httpcore-0.18.0 httpx-0.25.0 huggingface_hub-0.17.2\n" ] } ] }, { "cell_type": "code", "execution_count": 27, "metadata": { "id": "borSZCgAOfOo" }, "outputs": [], "source": [ "import httpx\n", "from huggingface_hub import list_models, ModelFilter, hf_hub_url\n", "import pandas as pd\n", "from tqdm.contrib.concurrent import thread_map\n", "from huggingface_hub import model_info\n", "from tqdm.auto import tqdm" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "d0cwY4nNOfOo", "outputId": "a65725ea-97a1-4cb4-de1d-5cf0876ca4ab" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "6981" ] }, "metadata": {}, "execution_count": 3 } ], "source": [ "peft_models = list(iter(list_models(filter=ModelFilter(library=\"peft\"), full=True)))\n", "len(peft_models)" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "6yfMtGYcOfOq", "outputId": "d59f125b-ae61-4aeb-9316-519543fba3c3" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "RepoFile: {'blob_id': None, 'lfs': None, 'rfilename': 'adapter_config.json', 'size': None}" ] }, "metadata": {}, "execution_count": 4 } ], "source": [ "peft_models[0].siblings[2]" ] }, { "cell_type": "code", "execution_count": 5, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "jLEeIwZAOfOq", "outputId": "ed4d1041-46f7-473d-d53e-f7ffbf5d4248" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "{'base_model_name_or_path': 'facebook/opt-350m',\n", " 'bias': 'none',\n", " 'enable_lora': None,\n", " 'fan_in_fan_out': False,\n", " 'inference_mode': True,\n", " 'lora_alpha': 32,\n", " 'lora_dropout': 0.05,\n", " 'merge_weights': False,\n", " 'peft_type': 'LORA',\n", " 'r': 16,\n", " 'target_modules': ['q_proj', 'v_proj'],\n", " 'task_type': 'SEQ_CLS'}" ] }, "metadata": {}, "execution_count": 5 } ], "source": [ "httpx.get(hf_hub_url(peft_models[0].modelId,'adapter_config.json')).json()" ] }, { "cell_type": "code", "execution_count": 6, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 36 }, "id": "xMM2229VOfOq", "outputId": "889bb7ad-c90f-41e7-98de-ec56a700ac44" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "'facebook/opt-350m'" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "string" } }, "metadata": {}, "execution_count": 6 } ], "source": [ "httpx.get(hf_hub_url(peft_models[0].modelId,'adapter_config.json')).json().get('base_model_name_or_path')" ] }, { "cell_type": "code", "execution_count": 7, "metadata": { "id": "OjKGmWMDOfOr" }, "outputs": [], "source": [ "def try_get_base_model(model):\n", " model_id = model.modelId\n", " downloads = model.downloads\n", " author = model.author\n", " try:\n", " return model_id, httpx.get(hf_hub_url(model_id,'adapter_config.json')).json().get('base_model_name_or_path'), downloads, author\n", " except Exception:\n", " return None" ] }, { "cell_type": "code", "execution_count": 9, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 49, "referenced_widgets": [ "9dc99b649eaa4e4eb68d1aa37651566e", "efdcc8fa8b0d417ab2d63f5cee541aed", "a9a4ce193d224638bc76f527ead85cbf", "9ba1d7f9e9014d58a98a9e0ac45c7cc9", "f408225ced644598981dcf25fae01591", "1ab7d6ccc0f54e779f368ea719b4785b", "82aa5fcfa95a48089b63618a4120b6f6", "e32769c7cf2344549a5093f132d378e1", "56c3ec8fd04541808757d4c373258637", "d64eb69ca9934364b164ed432bb71141", "37dfab2a0c5c43dcac7b2cd6960bfda5" ] }, "id": "ovssytREOfOr", "outputId": "0c67429d-219c-4f58-9ae4-784a0accc1de" }, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ " 0%| | 0/6981 [00:00, ?it/s]" ], "application/vnd.jupyter.widget-view+json": { "version_major": 2, "version_minor": 0, "model_id": "9dc99b649eaa4e4eb68d1aa37651566e" } }, "metadata": {} } ], "source": [ "results = thread_map(try_get_base_model, peft_models)" ] }, { "cell_type": "code", "execution_count": 11, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 424 }, "id": "IGxeikIsOfOs", "outputId": "f8aadaf6-fc5c-47db-83fb-a4a2510764ea" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ " model_id \\\n", "562 aarnphm/opt-6-7b-quotes \n", "914 artek0chumak/bloom-560m-safe-peft \n", "1061 peft-internal-testing/tiny-OPTForCausalLM-lora \n", "1065 peft-internal-testing/tiny_T5ForSeq2SeqLM-lora \n", "1063 peft-internal-testing/tiny_OPTForQuestionAnswe... \n", "... ... \n", "2569 KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... \n", "2567 KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... \n", "2566 KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... \n", "2565 KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... \n", "6980 AhmedBou/Falcon_7B_Science_Exam_QLoRA \n", "\n", " base_model downloads \\\n", "562 /home/ubuntu/.local/share/bentoml/models/pt-fa... 290304.0 \n", "914 bigscience/bloom-560m 33069.0 \n", "1061 hf-internal-testing/tiny-random-OPTForCausalLM 17217.0 \n", "1065 trl-internal-testing/tiny-T5ForConditionalGene... 15197.0 \n", "1063 hf-internal-testing/tiny-random-OPTForCausalLM 15182.0 \n", "... ... ... \n", "2569 gpt2 0.0 \n", "2567 gpt2 0.0 \n", "2566 gpt2 0.0 \n", "2565 gpt2 0.0 \n", "6980 tiiuae/falcon-7b 0.0 \n", "\n", " author \n", "562 aarnphm \n", "914 artek0chumak \n", "1061 peft-internal-testing \n", "1065 peft-internal-testing \n", "1063 peft-internal-testing \n", "... ... \n", "2569 KingKazma \n", "2567 KingKazma \n", "2566 KingKazma \n", "2565 KingKazma \n", "6980 AhmedBou \n", "\n", "[6663 rows x 4 columns]" ], "text/html": [ "\n", "
\n", " | model_id | \n", "base_model | \n", "downloads | \n", "author | \n", "
---|---|---|---|---|
562 | \n", "aarnphm/opt-6-7b-quotes | \n", "/home/ubuntu/.local/share/bentoml/models/pt-fa... | \n", "290304.0 | \n", "aarnphm | \n", "
914 | \n", "artek0chumak/bloom-560m-safe-peft | \n", "bigscience/bloom-560m | \n", "33069.0 | \n", "artek0chumak | \n", "
1061 | \n", "peft-internal-testing/tiny-OPTForCausalLM-lora | \n", "hf-internal-testing/tiny-random-OPTForCausalLM | \n", "17217.0 | \n", "peft-internal-testing | \n", "
1065 | \n", "peft-internal-testing/tiny_T5ForSeq2SeqLM-lora | \n", "trl-internal-testing/tiny-T5ForConditionalGene... | \n", "15197.0 | \n", "peft-internal-testing | \n", "
1063 | \n", "peft-internal-testing/tiny_OPTForQuestionAnswe... | \n", "hf-internal-testing/tiny-random-OPTForCausalLM | \n", "15182.0 | \n", "peft-internal-testing | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2569 | \n", "KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... | \n", "gpt2 | \n", "0.0 | \n", "KingKazma | \n", "
2567 | \n", "KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... | \n", "gpt2 | \n", "0.0 | \n", "KingKazma | \n", "
2566 | \n", "KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... | \n", "gpt2 | \n", "0.0 | \n", "KingKazma | \n", "
2565 | \n", "KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... | \n", "gpt2 | \n", "0.0 | \n", "KingKazma | \n", "
6980 | \n", "AhmedBou/Falcon_7B_Science_Exam_QLoRA | \n", "tiiuae/falcon-7b | \n", "0.0 | \n", "AhmedBou | \n", "
6663 rows × 4 columns
\n", "\n", " | model_id | \n", "base_model | \n", "downloads | \n", "author | \n", "
---|---|---|---|---|
914 | \n", "artek0chumak/bloom-560m-safe-peft | \n", "bigscience/bloom-560m | \n", "33069.0 | \n", "artek0chumak | \n", "
1061 | \n", "peft-internal-testing/tiny-OPTForCausalLM-lora | \n", "hf-internal-testing/tiny-random-OPTForCausalLM | \n", "17217.0 | \n", "peft-internal-testing | \n", "
1065 | \n", "peft-internal-testing/tiny_T5ForSeq2SeqLM-lora | \n", "trl-internal-testing/tiny-T5ForConditionalGene... | \n", "15197.0 | \n", "peft-internal-testing | \n", "
1063 | \n", "peft-internal-testing/tiny_OPTForQuestionAnswe... | \n", "hf-internal-testing/tiny-random-OPTForCausalLM | \n", "15182.0 | \n", "peft-internal-testing | \n", "
1066 | \n", "peft-internal-testing/tiny_OPTForSequenceClass... | \n", "hf-internal-testing/tiny-random-OPTForCausalLM | \n", "15178.0 | \n", "peft-internal-testing | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2569 | \n", "KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... | \n", "gpt2 | \n", "0.0 | \n", "KingKazma | \n", "
2567 | \n", "KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... | \n", "gpt2 | \n", "0.0 | \n", "KingKazma | \n", "
2566 | \n", "KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... | \n", "gpt2 | \n", "0.0 | \n", "KingKazma | \n", "
2565 | \n", "KingKazma/cnn_dailymail_gpt2_p_tuning_500_10_3... | \n", "gpt2 | \n", "0.0 | \n", "KingKazma | \n", "
6980 | \n", "AhmedBou/Falcon_7B_Science_Exam_QLoRA | \n", "tiiuae/falcon-7b | \n", "0.0 | \n", "AhmedBou | \n", "
5570 rows × 4 columns
\n", "