File size: 158,780 Bytes
14ada6c
1
{"cells":[{"cell_type":"markdown","id":"c454c018-02b7-4c3d-a21f-411748963a3f","metadata":{"id":"c454c018-02b7-4c3d-a21f-411748963a3f"},"source":["# Workshop: Sentiment Analysis"]},{"cell_type":"markdown","id":"2eda2e01-dfc4-42a6-9b6a-5cdf39fbce78","metadata":{"id":"2eda2e01-dfc4-42a6-9b6a-5cdf39fbce78"},"source":["<div>\n","<img src=\"https://lh3.googleusercontent.com/pw/ADCreHdzakFbNdHwBE1ZrwOiNCQibViWOir9DF9Dv4fbZEdWpx4mzFOT_RxkUGLTyDW7fQ0OwEyNQwqllupbvm0WiU0RNuFs-kWx1fTIvjiSkPGE5m64PilOIeApxQLwX_rl-JU7uYT-ROxdppIsJimCeos=w406-h451-s-no-gm?authuser=0\" width=\"390\"/>\n","</div>"]},{"cell_type":"code","source":["ls"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"eBO3zjLr0gY9","executionInfo":{"status":"ok","timestamp":1713839953212,"user_tz":-420,"elapsed":8,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"dc57b433-6f87-4904-99c2-0002d39a7c60"},"id":"eBO3zjLr0gY9","execution_count":1,"outputs":[{"output_type":"stream","name":"stdout","text":["\u001b[0m\u001b[01;34msample_data\u001b[0m/\n"]}]},{"cell_type":"code","source":["from google.colab import drive\n","drive.mount('/content/drive')"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"dXQK7eEb0mGr","executionInfo":{"status":"ok","timestamp":1713840022646,"user_tz":-420,"elapsed":25112,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"93400453-f2a5-4d20-f3bc-f7c03c8abf41"},"id":"dXQK7eEb0mGr","execution_count":2,"outputs":[{"output_type":"stream","name":"stdout","text":["Mounted at /content/drive\n"]}]},{"cell_type":"code","source":["cd \"/content/drive/MyDrive/689-WorkShop/Ass13-SemtimentAna\""],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"eB1rpKAu04zB","executionInfo":{"status":"ok","timestamp":1713840067921,"user_tz":-420,"elapsed":329,"user":{"displayName":"wannisa 
paethong","userId":"05174644342145313126"}},"outputId":"28e5fa28-6dd0-4891-fea8-b363826e9602"},"id":"eB1rpKAu04zB","execution_count":3,"outputs":[{"output_type":"stream","name":"stdout","text":["/content/drive/MyDrive/689-WorkShop/Ass13-SemtimentAna\n"]}]},{"cell_type":"code","source":["ls"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"g8kKS4TJ1CkA","executionInfo":{"status":"ok","timestamp":1713840076790,"user_tz":-420,"elapsed":834,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"cbc24ac9-9c22-4af4-de0e-38d3a0edd796"},"id":"g8kKS4TJ1CkA","execution_count":4,"outputs":[{"output_type":"stream","name":"stdout","text":["imdb_reviews.csv  WorkshopSentimentsAna-65130700309.ipynb  WorkshopSentimentsAna-std.ipynb\n"]}]},{"cell_type":"code","execution_count":5,"id":"7ef9db65-1fda-4fc6-8bb9-bc52bdbb9529","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"7ef9db65-1fda-4fc6-8bb9-bc52bdbb9529","executionInfo":{"status":"ok","timestamp":1713840098623,"user_tz":-420,"elapsed":14252,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"85c975d0-c099-4fc5-e228-b726da3fca93"},"outputs":[{"output_type":"stream","name":"stdout","text":["Requirement already satisfied: nltk in /usr/local/lib/python3.10/dist-packages (3.8.1)\n","Requirement already satisfied: click in /usr/local/lib/python3.10/dist-packages (from nltk) (8.1.7)\n","Requirement already satisfied: joblib in /usr/local/lib/python3.10/dist-packages (from nltk) (1.4.0)\n","Requirement already satisfied: regex>=2021.8.3 in /usr/local/lib/python3.10/dist-packages (from nltk) (2023.12.25)\n","Requirement already satisfied: tqdm in /usr/local/lib/python3.10/dist-packages (from nltk) (4.66.2)\n","Requirement already satisfied: transformers in /usr/local/lib/python3.10/dist-packages (4.40.0)\n","Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers) 
(3.13.4)\n","Requirement already satisfied: huggingface-hub<1.0,>=0.19.3 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.20.3)\n","Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (1.25.2)\n","Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers) (24.0)\n","Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (6.0.1)\n","Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (2023.12.25)\n","Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers) (2.31.0)\n","Requirement already satisfied: tokenizers<0.20,>=0.19 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.19.1)\n","Requirement already satisfied: safetensors>=0.4.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.4.3)\n","Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers) (4.66.2)\n","Requirement already satisfied: fsspec>=2023.5.0 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.19.3->transformers) (2023.6.0)\n","Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.19.3->transformers) (4.11.0)\n","Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.3.2)\n","Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.7)\n","Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2.0.7)\n","Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) 
(2024.2.2)\n"]}],"source":["%pip install nltk\n","%pip install transformers"]},{"cell_type":"markdown","id":"1a0b8ed9-f240-47b4-aa62-0cf48bdd7868","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"1a0b8ed9-f240-47b4-aa62-0cf48bdd7868"},"source":["## Rule-Based Approaches\n","\n","- **Lexicon-Based Methods**: Use sentiment lexicons or dictionaries that contain words annotated with their sentiment polarity (positive, negative, neutral).\n","- **Pattern Matching**: Identify sentiment based on predefined patterns or rules in the text.\n"]},{"cell_type":"code","execution_count":8,"id":"9f7f14b4-60ba-4a92-a9d0-a124e62fe03b","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"9f7f14b4-60ba-4a92-a9d0-a124e62fe03b","executionInfo":{"status":"ok","timestamp":1713840585023,"user_tz":-420,"elapsed":1966,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"c8ce549c-78f7-47b4-88f2-149744da949d"},"outputs":[{"output_type":"stream","name":"stderr","text":["[nltk_data] Downloading package stopwords to /root/nltk_data...\n","[nltk_data]   Unzipping corpora/stopwords.zip.\n","[nltk_data] Downloading package punkt to /root/nltk_data...\n","[nltk_data]   Unzipping tokenizers/punkt.zip.\n"]},{"output_type":"execute_result","data":{"text/plain":["True"]},"metadata":{},"execution_count":8}],"source":["import nltk\n","from nltk.tokenize import word_tokenize\n","from nltk.corpus import stopwords\n","\n","# word_tokenize loads 'punkt' on older NLTK releases and 'punkt_tab' on newer ones.\n","# The pip install above is unpinned, so fetch both to stay runnable on either.\n","nltk.download('stopwords')\n","nltk.download('punkt')\n","nltk.download('punkt_tab')"]},{"cell_type":"code","execution_count":9,"id":"8a25f60f-f202-49cd-b965-e3ebb1676786","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"8a25f60f-f202-49cd-b965-e3ebb1676786","executionInfo":{"status":"ok","timestamp":1713840589093,"user_tz":-420,"elapsed":349,"user":{"displayName":"wannisa 
paethong","userId":"05174644342145313126"}},"outputId":"fa23eaf9-86ce-41c8-de1d-01946a330f2e"},"outputs":[{"output_type":"stream","name":"stdout","text":["['i', 'me', 'my', 'myself', 'we', 'our', 'ours', 'ourselves', 'you', \"you're\", \"you've\", \"you'll\", \"you'd\", 'your', 'yours', 'yourself', 'yourselves', 'he', 'him', 'his', 'himself', 'she', \"she's\", 'her', 'hers', 'herself', 'it', \"it's\", 'its', 'itself', 'they', 'them', 'their', 'theirs', 'themselves', 'what', 'which', 'who', 'whom', 'this', 'that', \"that'll\", 'these', 'those', 'am', 'is', 'are', 'was', 'were', 'be', 'been', 'being', 'have', 'has', 'had', 'having', 'do', 'does', 'did', 'doing', 'a', 'an', 'the', 'and', 'but', 'if', 'or', 'because', 'as', 'until', 'while', 'of', 'at', 'by', 'for', 'with', 'about', 'against', 'between', 'into', 'through', 'during', 'before', 'after', 'above', 'below', 'to', 'from', 'up', 'down', 'in', 'out', 'on', 'off', 'over', 'under', 'again', 'further', 'then', 'once', 'here', 'there', 'when', 'where', 'why', 'how', 'all', 'any', 'both', 'each', 'few', 'more', 'most', 'other', 'some', 'such', 'no', 'nor', 'not', 'only', 'own', 'same', 'so', 'than', 'too', 'very', 's', 't', 'can', 'will', 'just', 'don', \"don't\", 'should', \"should've\", 'now', 'd', 'll', 'm', 'o', 're', 've', 'y', 'ain', 'aren', \"aren't\", 'couldn', \"couldn't\", 'didn', \"didn't\", 'doesn', \"doesn't\", 'hadn', \"hadn't\", 'hasn', \"hasn't\", 'haven', \"haven't\", 'isn', \"isn't\", 'ma', 'mightn', \"mightn't\", 'mustn', \"mustn't\", 'needn', \"needn't\", 'shan', \"shan't\", 'shouldn', \"shouldn't\", 'wasn', \"wasn't\", 'weren', \"weren't\", 'won', \"won't\", 'wouldn', 
\"wouldn't\"]\n"]}],"source":["print(stopwords.words('english'))"]},{"cell_type":"code","execution_count":10,"id":"7652d6d2-ba4c-4d02-bfe3-313b6e0f24a5","metadata":{"tags":[],"id":"7652d6d2-ba4c-4d02-bfe3-313b6e0f24a5","executionInfo":{"status":"ok","timestamp":1713841458584,"user_tz":-420,"elapsed":344,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["text = \"I had a good experience with the product. Highly recommended!\""]},{"cell_type":"code","execution_count":11,"id":"53fc7d50-59fa-4bec-9ae4-b93a1a3847f1","metadata":{"tags":[],"id":"53fc7d50-59fa-4bec-9ae4-b93a1a3847f1","executionInfo":{"status":"ok","timestamp":1713841468235,"user_tz":-420,"elapsed":318,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["tokens = word_tokenize(text.lower())"]},{"cell_type":"code","execution_count":12,"id":"faac761f-912e-44f7-b7b0-626baaea6a56","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"faac761f-912e-44f7-b7b0-626baaea6a56","executionInfo":{"status":"ok","timestamp":1713841469507,"user_tz":-420,"elapsed":2,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"fe91fd19-88d2-4913-c926-fed1f59089a6"},"outputs":[{"output_type":"stream","name":"stdout","text":["['i', 'had', 'a', 'good', 'experience', 'with', 'the', 'product', '.', 'highly', 'recommended', '!']\n"]}],"source":["print(tokens)"]},{"cell_type":"code","execution_count":13,"id":"9f6543a2-76f4-4993-b535-f90e50bada72","metadata":{"tags":[],"id":"9f6543a2-76f4-4993-b535-f90e50bada72","executionInfo":{"status":"ok","timestamp":1713841471657,"user_tz":-420,"elapsed":1,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["stop_words = 
set(stopwords.words('english'))"]},{"cell_type":"code","execution_count":14,"id":"4d7f529d-f006-48db-a092-2262f17cb3cd","metadata":{"tags":[],"id":"4d7f529d-f006-48db-a092-2262f17cb3cd","executionInfo":{"status":"ok","timestamp":1713841473288,"user_tz":-420,"elapsed":1,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["tokens = [word for word in tokens if word.isalnum() and word not in stop_words]  #alnum = alphanumeric"]},{"cell_type":"code","execution_count":15,"id":"4acfb41c-615d-4e8b-92dc-3f73a4188402","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"4acfb41c-615d-4e8b-92dc-3f73a4188402","executionInfo":{"status":"ok","timestamp":1713841476285,"user_tz":-420,"elapsed":352,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"1ae566fc-8dab-41b8-9c8b-db17ec037666"},"outputs":[{"output_type":"stream","name":"stdout","text":["['good', 'experience', 'product', 'highly', 'recommended']\n"]}],"source":["print(tokens)"]},{"cell_type":"code","execution_count":null,"id":"c3cfd1cc-3f30-43de-a469-dec0b3816313","metadata":{"id":"c3cfd1cc-3f30-43de-a469-dec0b3816313"},"outputs":[],"source":[]},{"cell_type":"code","execution_count":16,"id":"aed2ad01-27e5-45e3-a55c-63084966a482","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"aed2ad01-27e5-45e3-a55c-63084966a482","executionInfo":{"status":"ok","timestamp":1713841613192,"user_tz":-420,"elapsed":313,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"1156b9ea-186c-4282-8eb7-b7e6ce0328a3"},"outputs":[{"output_type":"stream","name":"stdout","text":["Sentiment: Positive\n"]}],"source":["# Sample positive and negative words\n","positive_words = {'good', 'awesome', 'excellent', 'happy', 'positive'}\n","negative_words = {'bad', 'terrible', 'poor', 'unhappy', 'negative'}\n","\n","# Tokens that flip the polarity of the next sentiment word ('not good' -> negative).\n","# word_tokenize splits contractions, so \"isn't\" arrives as 'is' followed by \"n't\".\n","negation_words = {'not', 'no', 'never', \"n't\"}\n","\n","# Build the stop-word set once instead of re-reading the corpus on every call\n","english_stop_words = frozenset(stopwords.words('english'))\n","\n","def rule_based_sentiment_analysis(text):\n",
"    \"\"\"Classify text as 'Positive', 'Negative' or 'Neutral' using the word lexicons.\n","\n","    Each positive lexicon word adds 1 to the score and each negative word\n","    subtracts 1. A sentiment word that follows a negation ('not good',\n","    'never happy') is counted with the opposite sign.\n","\n","    Args:\n","        text: Raw text to analyse.\n","\n","    Returns:\n","        'Positive' if the score is above zero, 'Negative' if it is below zero,\n","        otherwise 'Neutral'.\n","    \"\"\"\n","    sentiment_score = 0\n","    negated = False\n","    for word in word_tokenize(text.lower()):\n","        if word in negation_words:\n","            # Check negators first: they are stop words or non-alphanumeric tokens\n","            negated = True\n","        elif not word.isalnum():\n","            # Punctuation ends the scope of a pending negation\n","            negated = False\n","        elif word not in english_stop_words:\n","            # Stop words are skipped without clearing the negation ('not very good')\n","            polarity = (word in positive_words) - (word in negative_words)\n","            sentiment_score += -polarity if negated else polarity\n","            negated = False\n","\n","    # Classify sentiment\n","    if sentiment_score > 0:\n","        return 'Positive'\n","    elif sentiment_score < 0:\n","        return 'Negative'\n","    else:\n","        return 'Neutral'\n","\n","# Example usage\n","text_to_analyze = \"I had a good experience with the product. Highly recommended!\"\n","sentiment_result = rule_based_sentiment_analysis(text_to_analyze)\n","print(f\"Sentiment: {sentiment_result}\")"]},{"cell_type":"markdown","id":"21764069-0b07-4b3e-8103-b2ab464a9182","metadata":{"tags":[],"id":"21764069-0b07-4b3e-8103-b2ab464a9182"},"source":["## Machine Learning Approaches"]},{"cell_type":"markdown","id":"dc739c8a-a453-43d1-bdc5-ad10d823d748","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"dc739c8a-a453-43d1-bdc5-ad10d823d748"},"source":["### Import packages"]},{"cell_type":"code","execution_count":17,"id":"7e030b97-e111-45ea-b00f-09a360f3400e","metadata":{"tags":[],"id":"7e030b97-e111-45ea-b00f-09a360f3400e","executionInfo":{"status":"ok","timestamp":1713841657541,"user_tz":-420,"elapsed":720,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["import pandas as pd\n","from sklearn.pipeline import Pipeline\n","from sklearn.utils import shuffle\n","from sklearn.model_selection import train_test_split\n","from sklearn.feature_extraction.text import TfidfVectorizer\n","# from sklearn.svm import SVC\n","from sklearn.naive_bayes import MultinomialNB\n","from sklearn.metrics import classification_report, 
confusion_matrix\n","\n"]},{"cell_type":"markdown","id":"54c4fe66-f52f-487f-bfd5-0ea6e05206ce","metadata":{"tags":[],"id":"54c4fe66-f52f-487f-bfd5-0ea6e05206ce"},"source":["### TF-IDF vectorizer"]},{"cell_type":"markdown","id":"3f5b7e92-5de4-4894-b2be-47dac1cf2482","metadata":{"id":"3f5b7e92-5de4-4894-b2be-47dac1cf2482"},"source":["\n","<div>\n","<img src=\"https://www.kdnuggets.com/wp-content/uploads/awan_convert_text_documents_tfidf_matrix_tfidfvectorizer_3.png\" width=\"590\"/>\n","</div>\n","\n","\n","Image sources: https://www.kdnuggets.com/2022/09/convert-text-documents-tfidf-matrix-tfidfvectorizer.html\n","\n","\n","\n","\n"]},{"cell_type":"markdown","id":"9bd125fc-11fd-414a-b8f0-ff7ef628fb94","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"9bd125fc-11fd-414a-b8f0-ff7ef628fb94"},"source":["##### Example on Small data"]},{"cell_type":"code","execution_count":18,"id":"8a61fdce-6544-4774-bc29-265bf4afaa90","metadata":{"tags":[],"id":"8a61fdce-6544-4774-bc29-265bf4afaa90","executionInfo":{"status":"ok","timestamp":1713841845540,"user_tz":-420,"elapsed":360,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["\n","\n","# Sample data\n","documents = [\n","    \"This is the first document.\",\n","    \"This document is the second document.\",\n","    \"And this is the third one.\",\n","    \"Is this the first document?\"\n","]"]},{"cell_type":"code","execution_count":19,"id":"5794027b-2bee-46d9-9b4d-9cbaa7c4120f","metadata":{"tags":[],"id":"5794027b-2bee-46d9-9b4d-9cbaa7c4120f","executionInfo":{"status":"ok","timestamp":1713841849693,"user_tz":-420,"elapsed":471,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["# Create a DataFrame for better visualization\n","df = pd.DataFrame({'Text': 
documents})"]},{"cell_type":"code","source":["df"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":175},"id":"Wje-T5kT712V","executionInfo":{"status":"ok","timestamp":1713841863619,"user_tz":-420,"elapsed":422,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"96738978-cc1b-4565-f336-173f2a348453"},"id":"Wje-T5kT712V","execution_count":20,"outputs":[{"output_type":"execute_result","data":{"text/plain":["                                    Text\n","0            This is the first document.\n","1  This document is the second document.\n","2             And this is the third one.\n","3            Is this the first document?"],"text/html":["\n","  <div id=\"df-a66940df-0fc7-4bfe-82ac-69f3b0c52155\" class=\"colab-df-container\">\n","    <div>\n","<style scoped>\n","    .dataframe tbody tr th:only-of-type {\n","        vertical-align: middle;\n","    }\n","\n","    .dataframe tbody tr th {\n","        vertical-align: top;\n","    }\n","\n","    .dataframe thead th {\n","        text-align: right;\n","    }\n","</style>\n","<table border=\"1\" class=\"dataframe\">\n","  <thead>\n","    <tr style=\"text-align: right;\">\n","      <th></th>\n","      <th>Text</th>\n","    </tr>\n","  </thead>\n","  <tbody>\n","    <tr>\n","      <th>0</th>\n","      <td>This is the first document.</td>\n","    </tr>\n","    <tr>\n","      <th>1</th>\n","      <td>This document is the second document.</td>\n","    </tr>\n","    <tr>\n","      <th>2</th>\n","      <td>And this is the third one.</td>\n","    </tr>\n","    <tr>\n","      <th>3</th>\n","      <td>Is this the first document?</td>\n","    </tr>\n","  </tbody>\n","</table>\n","</div>\n","    <div class=\"colab-df-buttons\">\n","\n","  <div class=\"colab-df-container\">\n","    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-a66940df-0fc7-4bfe-82ac-69f3b0c52155')\"\n","            title=\"Convert this dataframe to an interactive table.\"\n","            
style=\"display:none;\">\n","\n","  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\" viewBox=\"0 -960 960 960\">\n","    <path d=\"M120-120v-720h720v720H120Zm60-500h600v-160H180v160Zm220 220h160v-160H400v160Zm0 220h160v-160H400v160ZM180-400h160v-160H180v160Zm440 0h160v-160H620v160ZM180-180h160v-160H180v160Zm440 0h160v-160H620v160Z\"/>\n","  </svg>\n","    </button>\n","\n","  <style>\n","    .colab-df-container {\n","      display:flex;\n","      gap: 12px;\n","    }\n","\n","    .colab-df-convert {\n","      background-color: #E8F0FE;\n","      border: none;\n","      border-radius: 50%;\n","      cursor: pointer;\n","      display: none;\n","      fill: #1967D2;\n","      height: 32px;\n","      padding: 0 0 0 0;\n","      width: 32px;\n","    }\n","\n","    .colab-df-convert:hover {\n","      background-color: #E2EBFA;\n","      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n","      fill: #174EA6;\n","    }\n","\n","    .colab-df-buttons div {\n","      margin-bottom: 4px;\n","    }\n","\n","    [theme=dark] .colab-df-convert {\n","      background-color: #3B4455;\n","      fill: #D2E3FC;\n","    }\n","\n","    [theme=dark] .colab-df-convert:hover {\n","      background-color: #434B5C;\n","      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n","      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n","      fill: #FFFFFF;\n","    }\n","  </style>\n","\n","    <script>\n","      const buttonEl =\n","        document.querySelector('#df-a66940df-0fc7-4bfe-82ac-69f3b0c52155 button.colab-df-convert');\n","      buttonEl.style.display =\n","        google.colab.kernel.accessAllowed ? 
'block' : 'none';\n","\n","      async function convertToInteractive(key) {\n","        const element = document.querySelector('#df-a66940df-0fc7-4bfe-82ac-69f3b0c52155');\n","        const dataTable =\n","          await google.colab.kernel.invokeFunction('convertToInteractive',\n","                                                    [key], {});\n","        if (!dataTable) return;\n","\n","        const docLinkHtml = 'Like what you see? Visit the ' +\n","          '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n","          + ' to learn more about interactive tables.';\n","        element.innerHTML = '';\n","        dataTable['output_type'] = 'display_data';\n","        await google.colab.output.renderOutput(dataTable, element);\n","        const docLink = document.createElement('div');\n","        docLink.innerHTML = docLinkHtml;\n","        element.appendChild(docLink);\n","      }\n","    </script>\n","  </div>\n","\n","\n","<div id=\"df-a349aca5-128d-48ef-b973-1f625f3c942c\">\n","  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-a349aca5-128d-48ef-b973-1f625f3c942c')\"\n","            title=\"Suggest charts\"\n","            style=\"display:none;\">\n","\n","<svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n","     width=\"24px\">\n","    <g>\n","        <path d=\"M19 3H5c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V5c0-1.1-.9-2-2-2zM9 17H7v-7h2v7zm4 0h-2V7h2v10zm4 0h-2v-4h2v4z\"/>\n","    </g>\n","</svg>\n","  </button>\n","\n","<style>\n","  .colab-df-quickchart {\n","      --bg-color: #E8F0FE;\n","      --fill-color: #1967D2;\n","      --hover-bg-color: #E2EBFA;\n","      --hover-fill-color: #174EA6;\n","      --disabled-fill-color: #AAA;\n","      --disabled-bg-color: #DDD;\n","  }\n","\n","  [theme=dark] .colab-df-quickchart {\n","      --bg-color: #3B4455;\n","      --fill-color: #D2E3FC;\n","      --hover-bg-color: #434B5C;\n","      
--hover-fill-color: #FFFFFF;\n","      --disabled-bg-color: #3B4455;\n","      --disabled-fill-color: #666;\n","  }\n","\n","  .colab-df-quickchart {\n","    background-color: var(--bg-color);\n","    border: none;\n","    border-radius: 50%;\n","    cursor: pointer;\n","    display: none;\n","    fill: var(--fill-color);\n","    height: 32px;\n","    padding: 0;\n","    width: 32px;\n","  }\n","\n","  .colab-df-quickchart:hover {\n","    background-color: var(--hover-bg-color);\n","    box-shadow: 0 1px 2px rgba(60, 64, 67, 0.3), 0 1px 3px 1px rgba(60, 64, 67, 0.15);\n","    fill: var(--button-hover-fill-color);\n","  }\n","\n","  .colab-df-quickchart-complete:disabled,\n","  .colab-df-quickchart-complete:disabled:hover {\n","    background-color: var(--disabled-bg-color);\n","    fill: var(--disabled-fill-color);\n","    box-shadow: none;\n","  }\n","\n","  .colab-df-spinner {\n","    border: 2px solid var(--fill-color);\n","    border-color: transparent;\n","    border-bottom-color: var(--fill-color);\n","    animation:\n","      spin 1s steps(1) infinite;\n","  }\n","\n","  @keyframes spin {\n","    0% {\n","      border-color: transparent;\n","      border-bottom-color: var(--fill-color);\n","      border-left-color: var(--fill-color);\n","    }\n","    20% {\n","      border-color: transparent;\n","      border-left-color: var(--fill-color);\n","      border-top-color: var(--fill-color);\n","    }\n","    30% {\n","      border-color: transparent;\n","      border-left-color: var(--fill-color);\n","      border-top-color: var(--fill-color);\n","      border-right-color: var(--fill-color);\n","    }\n","    40% {\n","      border-color: transparent;\n","      border-right-color: var(--fill-color);\n","      border-top-color: var(--fill-color);\n","    }\n","    60% {\n","      border-color: transparent;\n","      border-right-color: var(--fill-color);\n","    }\n","    80% {\n","      border-color: transparent;\n","      border-right-color: 
var(--fill-color);\n","      border-bottom-color: var(--fill-color);\n","    }\n","    90% {\n","      border-color: transparent;\n","      border-bottom-color: var(--fill-color);\n","    }\n","  }\n","</style>\n","\n","  <script>\n","    async function quickchart(key) {\n","      const quickchartButtonEl =\n","        document.querySelector('#' + key + ' button');\n","      quickchartButtonEl.disabled = true;  // To prevent multiple clicks.\n","      quickchartButtonEl.classList.add('colab-df-spinner');\n","      try {\n","        const charts = await google.colab.kernel.invokeFunction(\n","            'suggestCharts', [key], {});\n","      } catch (error) {\n","        console.error('Error during call to suggestCharts:', error);\n","      }\n","      quickchartButtonEl.classList.remove('colab-df-spinner');\n","      quickchartButtonEl.classList.add('colab-df-quickchart-complete');\n","    }\n","    (() => {\n","      let quickchartButtonEl =\n","        document.querySelector('#df-a349aca5-128d-48ef-b973-1f625f3c942c button');\n","      quickchartButtonEl.style.display =\n","        google.colab.kernel.accessAllowed ? 
'block' : 'none';\n","    })();\n","  </script>\n","</div>\n","    </div>\n","  </div>\n"],"application/vnd.google.colaboratory.intrinsic+json":{"type":"dataframe","variable_name":"df","summary":"{\n  \"name\": \"df\",\n  \"rows\": 4,\n  \"fields\": [\n    {\n      \"column\": \"Text\",\n      \"properties\": {\n        \"dtype\": \"string\",\n        \"num_unique_values\": 4,\n        \"samples\": [\n          \"This document is the second document.\",\n          \"Is this the first document?\",\n          \"This is the first document.\"\n        ],\n        \"semantic_type\": \"\",\n        \"description\": \"\"\n      }\n    }\n  ]\n}"}},"metadata":{},"execution_count":20}]},{"cell_type":"code","execution_count":21,"id":"b49d5272-0383-4e39-910b-87276c4ffca2","metadata":{"tags":[],"id":"b49d5272-0383-4e39-910b-87276c4ffca2","executionInfo":{"status":"ok","timestamp":1713841867905,"user_tz":-420,"elapsed":2,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["# TF-IDF vectorization\n","vectorizer = TfidfVectorizer()\n","tfidf_matrix = vectorizer.fit_transform(df['Text'].tolist())"]},{"cell_type":"code","execution_count":22,"id":"46c0b47d-80ab-498b-91a2-7202f1c429fd","metadata":{"tags":[],"id":"46c0b47d-80ab-498b-91a2-7202f1c429fd","executionInfo":{"status":"ok","timestamp":1713841872560,"user_tz":-420,"elapsed":320,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["# Convert the TF-IDF matrix to a DataFrame\n","tfidf_df = pd.DataFrame(tfidf_matrix.toarray(), columns=vectorizer.get_feature_names_out())"]},{"cell_type":"code","execution_count":23,"id":"91c2bee0-5bb6-44b9-a609-1f3d0e891ad4","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"91c2bee0-5bb6-44b9-a609-1f3d0e891ad4","executionInfo":{"status":"ok","timestamp":1713841877895,"user_tz":-420,"elapsed":339,"user":{"displayName":"wannisa 
paethong","userId":"05174644342145313126"}},"outputId":"cdd8422d-bf3a-42c1-a476-2b15d7f37157"},"outputs":[{"output_type":"stream","name":"stdout","text":["Original Data:\n","                                    Text\n","0            This is the first document.\n","1  This document is the second document.\n","2             And this is the third one.\n","3            Is this the first document?\n"]}],"source":["# Print the original data\n","print(\"Original Data:\")\n","print(df)"]},{"cell_type":"code","execution_count":24,"id":"24c4a522-8ef4-4001-ada6-031a043b9a54","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"24c4a522-8ef4-4001-ada6-031a043b9a54","executionInfo":{"status":"ok","timestamp":1713841882847,"user_tz":-420,"elapsed":344,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"2606fbf1-fe41-4e03-899b-5d3f2776685f"},"outputs":[{"output_type":"stream","name":"stdout","text":["  (0, 1)\t0.46979138557992045\n","  (0, 2)\t0.5802858236844359\n","  (0, 6)\t0.38408524091481483\n","  (0, 3)\t0.38408524091481483\n","  (0, 8)\t0.38408524091481483\n","  (1, 5)\t0.5386476208856763\n","  (1, 1)\t0.6876235979836938\n","  (1, 6)\t0.281088674033753\n","  (1, 3)\t0.281088674033753\n","  (1, 8)\t0.281088674033753\n","  (2, 4)\t0.511848512707169\n","  (2, 7)\t0.511848512707169\n","  (2, 0)\t0.511848512707169\n","  (2, 6)\t0.267103787642168\n","  (2, 3)\t0.267103787642168\n","  (2, 8)\t0.267103787642168\n","  (3, 1)\t0.46979138557992045\n","  (3, 2)\t0.5802858236844359\n","  (3, 6)\t0.38408524091481483\n","  (3, 3)\t0.38408524091481483\n","  (3, 8)\t0.38408524091481483\n"]}],"source":["print(tfidf_matrix)"]},{"cell_type":"code","execution_count":25,"id":"6feb5892-284f-43d1-ab7b-5b13dbfadd0b","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"6feb5892-284f-43d1-ab7b-5b13dbfadd0b","executionInfo":{"status":"ok","timestamp":1713841924141,"user_tz":-420,"elapsed":341,"user":{"displayName":"wannisa 
paethong","userId":"05174644342145313126"}},"outputId":"0df619c6-eb05-43a0-da9d-7c0d3c0326b7"},"outputs":[{"output_type":"stream","name":"stdout","text":["\n","TF-IDF Matrix:\n","        and  document     first        is       one    second       the  \\\n","0  0.000000  0.469791  0.580286  0.384085  0.000000  0.000000  0.384085   \n","1  0.000000  0.687624  0.000000  0.281089  0.000000  0.538648  0.281089   \n","2  0.511849  0.000000  0.000000  0.267104  0.511849  0.000000  0.267104   \n","3  0.000000  0.469791  0.580286  0.384085  0.000000  0.000000  0.384085   \n","\n","      third      this  \n","0  0.000000  0.384085  \n","1  0.000000  0.281089  \n","2  0.511849  0.267104  \n","3  0.000000  0.384085  \n"]}],"source":["# Print the TF-IDF matrix\n","print(\"\\nTF-IDF Matrix:\")\n","print(tfidf_df)"]},{"cell_type":"markdown","id":"6802c239-edfa-462e-99ea-31386fd7aed4","metadata":{"tags":[],"id":"6802c239-edfa-462e-99ea-31386fd7aed4"},"source":["## Naive Bayes classifier trained on the TF-IDF features."]},{"cell_type":"markdown","id":"3accf6f8-6cae-4265-8d5d-fb5d40a07a2d","metadata":{"id":"3accf6f8-6cae-4265-8d5d-fb5d40a07a2d"},"source":["<div>\n","<img src=\"https://lh3.googleusercontent.com/pw/AP1GczOBxYJIFFWIiKJfFMdSp10-P1FNc6fZx7Wxa2NKpgw36p0Lady_mBMgxnKXS4cRbHwH2rnItp3cjvgIYdAN_LDcLlEzf1-8AJ62ybBOEGe8QKyH-CAojll13TKEDAo3yxwKvDh7wJRv2Rf1u7wWTjDI=w1911-h485-s-no-gm?authuser=0\" width=\"800\"/>\n","</div>\n"]},{"cell_type":"markdown","id":"9062063a-557b-4971-ad84-e3601b1a520e","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"9062063a-557b-4971-ad84-e3601b1a520e"},"source":["### Read data/Preparation"]},{"cell_type":"code","execution_count":26,"id":"8d2eab09-03c7-441e-9c78-0c2e069f4d25","metadata":{"tags":[],"id":"8d2eab09-03c7-441e-9c78-0c2e069f4d25","executionInfo":{"status":"ok","timestamp":1713843412522,"user_tz":-420,"elapsed":3570,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["# df = 
pd.read_csv(\"Womens_Clothing_E_Commerce_Reviews.csv\")\n","df = pd.read_csv(\"imdb_reviews.csv\")"]},{"cell_type":"code","execution_count":27,"id":"aca597f3-c8da-4314-990e-253d5ed719da","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"aca597f3-c8da-4314-990e-253d5ed719da","executionInfo":{"status":"ok","timestamp":1713843417599,"user_tz":-420,"elapsed":381,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"1bc779d8-5cb6-4263-cfde-29f2a9ce6e82"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["(50000, 2)"]},"metadata":{},"execution_count":27}],"source":["df.shape"]},{"cell_type":"code","execution_count":28,"id":"7d8131e4-4a69-45af-aa12-335c926e308f","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/","height":143},"id":"7d8131e4-4a69-45af-aa12-335c926e308f","executionInfo":{"status":"ok","timestamp":1713843430104,"user_tz":-420,"elapsed":994,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"03ebe55c-6c56-4084-cf22-0d4c48626788"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["                                                text     label\n","0  One of the other reviewers has mentioned that ...  positive\n","1  A wonderful little production. <br /><br />The...  positive\n","2  I thought this was a wonderful way to spend ti...  
positive"],"text/html":["\n","  <div id=\"df-ea50fdb4-e951-4e4b-be83-2b339db320c3\" class=\"colab-df-container\">\n","    <div>\n","<style scoped>\n","    .dataframe tbody tr th:only-of-type {\n","        vertical-align: middle;\n","    }\n","\n","    .dataframe tbody tr th {\n","        vertical-align: top;\n","    }\n","\n","    .dataframe thead th {\n","        text-align: right;\n","    }\n","</style>\n","<table border=\"1\" class=\"dataframe\">\n","  <thead>\n","    <tr style=\"text-align: right;\">\n","      <th></th>\n","      <th>text</th>\n","      <th>label</th>\n","    </tr>\n","  </thead>\n","  <tbody>\n","    <tr>\n","      <th>0</th>\n","      <td>One of the other reviewers has mentioned that ...</td>\n","      <td>positive</td>\n","    </tr>\n","    <tr>\n","      <th>1</th>\n","      <td>A wonderful little production. &lt;br /&gt;&lt;br /&gt;The...</td>\n","      <td>positive</td>\n","    </tr>\n","    <tr>\n","      <th>2</th>\n","      <td>I thought this was a wonderful way to spend ti...</td>\n","      <td>positive</td>\n","    </tr>\n","  </tbody>\n","</table>\n","</div>\n","    <div class=\"colab-df-buttons\">\n","\n","  <div class=\"colab-df-container\">\n","    <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-ea50fdb4-e951-4e4b-be83-2b339db320c3')\"\n","            title=\"Convert this dataframe to an interactive table.\"\n","            style=\"display:none;\">\n","\n","  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\" viewBox=\"0 -960 960 960\">\n","    <path d=\"M120-120v-720h720v720H120Zm60-500h600v-160H180v160Zm220 220h160v-160H400v160Zm0 220h160v-160H400v160ZM180-400h160v-160H180v160Zm440 0h160v-160H620v160ZM180-180h160v-160H180v160Zm440 0h160v-160H620v160Z\"/>\n","  </svg>\n","    </button>\n","\n","  <style>\n","    .colab-df-container {\n","      display:flex;\n","      gap: 12px;\n","    }\n","\n","    .colab-df-convert {\n","      background-color: #E8F0FE;\n","      border: none;\n","      
border-radius: 50%;\n","      cursor: pointer;\n","      display: none;\n","      fill: #1967D2;\n","      height: 32px;\n","      padding: 0 0 0 0;\n","      width: 32px;\n","    }\n","\n","    .colab-df-convert:hover {\n","      background-color: #E2EBFA;\n","      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n","      fill: #174EA6;\n","    }\n","\n","    .colab-df-buttons div {\n","      margin-bottom: 4px;\n","    }\n","\n","    [theme=dark] .colab-df-convert {\n","      background-color: #3B4455;\n","      fill: #D2E3FC;\n","    }\n","\n","    [theme=dark] .colab-df-convert:hover {\n","      background-color: #434B5C;\n","      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n","      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n","      fill: #FFFFFF;\n","    }\n","  </style>\n","\n","    <script>\n","      const buttonEl =\n","        document.querySelector('#df-ea50fdb4-e951-4e4b-be83-2b339db320c3 button.colab-df-convert');\n","      buttonEl.style.display =\n","        google.colab.kernel.accessAllowed ? 'block' : 'none';\n","\n","      async function convertToInteractive(key) {\n","        const element = document.querySelector('#df-ea50fdb4-e951-4e4b-be83-2b339db320c3');\n","        const dataTable =\n","          await google.colab.kernel.invokeFunction('convertToInteractive',\n","                                                    [key], {});\n","        if (!dataTable) return;\n","\n","        const docLinkHtml = 'Like what you see? 
Visit the ' +\n","          '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n","          + ' to learn more about interactive tables.';\n","        element.innerHTML = '';\n","        dataTable['output_type'] = 'display_data';\n","        await google.colab.output.renderOutput(dataTable, element);\n","        const docLink = document.createElement('div');\n","        docLink.innerHTML = docLinkHtml;\n","        element.appendChild(docLink);\n","      }\n","    </script>\n","  </div>\n","\n","\n","<div id=\"df-1d88a78d-63c4-4def-85a3-c5435003219b\">\n","  <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-1d88a78d-63c4-4def-85a3-c5435003219b')\"\n","            title=\"Suggest charts\"\n","            style=\"display:none;\">\n","\n","<svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n","     width=\"24px\">\n","    <g>\n","        <path d=\"M19 3H5c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V5c0-1.1-.9-2-2-2zM9 17H7v-7h2v7zm4 0h-2V7h2v10zm4 0h-2v-4h2v4z\"/>\n","    </g>\n","</svg>\n","  </button>\n","\n","<style>\n","  .colab-df-quickchart {\n","      --bg-color: #E8F0FE;\n","      --fill-color: #1967D2;\n","      --hover-bg-color: #E2EBFA;\n","      --hover-fill-color: #174EA6;\n","      --disabled-fill-color: #AAA;\n","      --disabled-bg-color: #DDD;\n","  }\n","\n","  [theme=dark] .colab-df-quickchart {\n","      --bg-color: #3B4455;\n","      --fill-color: #D2E3FC;\n","      --hover-bg-color: #434B5C;\n","      --hover-fill-color: #FFFFFF;\n","      --disabled-bg-color: #3B4455;\n","      --disabled-fill-color: #666;\n","  }\n","\n","  .colab-df-quickchart {\n","    background-color: var(--bg-color);\n","    border: none;\n","    border-radius: 50%;\n","    cursor: pointer;\n","    display: none;\n","    fill: var(--fill-color);\n","    height: 32px;\n","    padding: 0;\n","    width: 32px;\n","  }\n","\n","  .colab-df-quickchart:hover {\n","    
background-color: var(--hover-bg-color);\n","    box-shadow: 0 1px 2px rgba(60, 64, 67, 0.3), 0 1px 3px 1px rgba(60, 64, 67, 0.15);\n","    fill: var(--button-hover-fill-color);\n","  }\n","\n","  .colab-df-quickchart-complete:disabled,\n","  .colab-df-quickchart-complete:disabled:hover {\n","    background-color: var(--disabled-bg-color);\n","    fill: var(--disabled-fill-color);\n","    box-shadow: none;\n","  }\n","\n","  .colab-df-spinner {\n","    border: 2px solid var(--fill-color);\n","    border-color: transparent;\n","    border-bottom-color: var(--fill-color);\n","    animation:\n","      spin 1s steps(1) infinite;\n","  }\n","\n","  @keyframes spin {\n","    0% {\n","      border-color: transparent;\n","      border-bottom-color: var(--fill-color);\n","      border-left-color: var(--fill-color);\n","    }\n","    20% {\n","      border-color: transparent;\n","      border-left-color: var(--fill-color);\n","      border-top-color: var(--fill-color);\n","    }\n","    30% {\n","      border-color: transparent;\n","      border-left-color: var(--fill-color);\n","      border-top-color: var(--fill-color);\n","      border-right-color: var(--fill-color);\n","    }\n","    40% {\n","      border-color: transparent;\n","      border-right-color: var(--fill-color);\n","      border-top-color: var(--fill-color);\n","    }\n","    60% {\n","      border-color: transparent;\n","      border-right-color: var(--fill-color);\n","    }\n","    80% {\n","      border-color: transparent;\n","      border-right-color: var(--fill-color);\n","      border-bottom-color: var(--fill-color);\n","    }\n","    90% {\n","      border-color: transparent;\n","      border-bottom-color: var(--fill-color);\n","    }\n","  }\n","</style>\n","\n","  <script>\n","    async function quickchart(key) {\n","      const quickchartButtonEl =\n","        document.querySelector('#' + key + ' button');\n","      quickchartButtonEl.disabled = true;  // To prevent multiple clicks.\n","      
quickchartButtonEl.classList.add('colab-df-spinner');\n","      try {\n","        const charts = await google.colab.kernel.invokeFunction(\n","            'suggestCharts', [key], {});\n","      } catch (error) {\n","        console.error('Error during call to suggestCharts:', error);\n","      }\n","      quickchartButtonEl.classList.remove('colab-df-spinner');\n","      quickchartButtonEl.classList.add('colab-df-quickchart-complete');\n","    }\n","    (() => {\n","      let quickchartButtonEl =\n","        document.querySelector('#df-1d88a78d-63c4-4def-85a3-c5435003219b button');\n","      quickchartButtonEl.style.display =\n","        google.colab.kernel.accessAllowed ? 'block' : 'none';\n","    })();\n","  </script>\n","</div>\n","    </div>\n","  </div>\n"],"application/vnd.google.colaboratory.intrinsic+json":{"type":"dataframe","variable_name":"df","summary":"{\n  \"name\": \"df\",\n  \"rows\": 50000,\n  \"fields\": [\n    {\n      \"column\": \"text\",\n      \"properties\": {\n        \"dtype\": \"string\",\n        \"num_unique_values\": 49582,\n        \"samples\": [\n          \"\\\"Soul Plane\\\" is a horrible attempt at comedy that only should appeal people with thick skulls, bloodshot eyes and furry pawns. <br /><br />The plot is not only incoherent but also non-existent, acting is mostly sub sub-par with a gang of highly moronic and dreadful characters thrown in for bad measure, jokes are often spotted miles ahead and almost never even a bit amusing. This movie lacks any structure and is full of racial stereotypes that must have seemed old even in the fifties, the only thing it really has going for it is some pretty ladies, but really, if you want that you can rent something from the \\\"Adult\\\" section. 
OK?<br /><br />I can hardly see anything here to recommend since you'll probably have a lot a better and productive time chasing rats with a sledgehammer or inventing waterproof teabags or whatever.<br /><br />2/10\",\n          \"Guest from the Future tells a fascinating story of time travel, friendship, battle of good and evil -- all with a small budget, child actors, and few special effects. Something for Spielberg and Lucas to learn from. ;) A sixth-grader Kolya \\\"Nick\\\" Gerasimov finds a time machine in the basement of a decrepit building and travels 100 years into the future. He discovers a near-perfect, utopian society where robots play guitars and write poetry, everyone is kind to each other and people enjoy everything technology has to offer. Alice is the daughter of a prominent scientist who invented a device called Mielophone that allows to read minds of humans and animals. The device can be put to both good and bad use, depending on whose hands it falls into. When two evil space pirates from Saturn who want to rule the universe attempt to steal Mielophone, it falls into the hands of 20th century school boy Nick. With the pirates hot on his tracks, he travels back to his time, followed by the pirates, and Alice. Chaos, confusion and funny situations follow as the luckless pirates try to blend in with the earthlings. Alice enrolls in the same school Nick goes to and demonstrates superhuman abilities in PE class. The catch is, Alice doesn't know what Nick looks like, while the pirates do. Also, the pirates are able to change their appearance and turn literally into anyone. (Hmm, I wonder if this is where James Cameron got the idea for Terminator...) Who gets to Nick -- and Mielophone -- first? Excellent plot, non-stop adventures, and great soundtrack. 
I wish Hollywood made kid movies like this one...\",\n          \"\\\"National Treasure\\\" (2004) is a thoroughly misguided hodge-podge of plot entanglements that borrow from nearly every cloak and dagger government conspiracy clich\\u00e9 that has ever been written. The film stars Nicholas Cage as Benjamin Franklin Gates (how precious is that, I ask you?); a seemingly normal fellow who, for no other reason than being of a lineage of like-minded misguided fortune hunters, decides to steal a 'national treasure' that has been hidden by the United States founding fathers. After a bit of subtext and background that plays laughably (unintentionally) like Indiana Jones meets The Patriot, the film degenerates into one misguided whimsy after another \\u0096 attempting to create a 'Stanley Goodspeed' regurgitation of Nicholas Cage and launch the whole convoluted mess forward with a series of high octane, but disconnected misadventures.<br /><br />The relevancy and logic to having George Washington and his motley crew of patriots burying a king's ransom someplace on native soil, and then, going through the meticulous plan of leaving clues scattered throughout U.S. currency art work, is something that director Jon Turteltaub never quite gets around to explaining. Couldn't Washington found better usage for such wealth during the start up of the country? Hence, we are left with a mystery built on top of an enigma that is already on shaky ground by the time Ben appoints himself the new custodian of this untold wealth. Ben's intentions are noble \\u0096 if confusing. He's set on protecting the treasure. For who and when?\\u0085your guess is as good as mine.<br /><br />But there are a few problems with Ben's crusade. First up, his friend, Ian Holmes (Sean Bean) decides that he can't wait for Ben to make up his mind about stealing the Declaration of Independence from the National Archives (oh, yeah \\u0096 brilliant idea!). 
Presumably, the back of that famous document holds the secret answer to the ultimate fortune. So Ian tries to kill Ben. The assassination attempt is, of course, unsuccessful, if overly melodramatic. It also affords Ben the opportunity to pick up, and pick on, the very sultry curator of the archives, Abigail Chase (Diane Kruger). She thinks Ben is clearly a nut \\u0096 at least at the beginning. But true to action/romance form, Abby's resolve melts quicker than you can say, \\\"is that the Hope Diamond?\\\" The film moves into full X-File-ish mode, as the FBI, mistakenly believing that Ben is behind the theft, retaliate in various benign ways that lead to a multi-layering of action sequences reminiscent of Mission Impossible meets The Fugitive. Honestly, don't those guys ever get 'intelligence' information that is correct? In the final analysis, \\\"National Treasure\\\" isn't great film making, so much as it's a patchwork rehash of tired old bits from other movies, woven together from scraps, the likes of which would make IL' Betsy Ross blush.<br /><br />The Buena Vista DVD delivers a far more generous treatment than this film is deserving of. The anamorphic widescreen picture exhibits a very smooth and finely detailed image with very rich colors, natural flesh tones, solid blacks and clean whites. The stylized image is also free of blemishes and digital enhancements. The audio is 5.1 and delivers a nice sonic boom to your side and rear speakers with intensity and realism. Extras include a host of promotional junket material that is rather deep and over the top in its explanation of how and why this film was made. If only, as an audience, we had had more clarification as to why Ben and co. were chasing after an illusive treasure, this might have been one good flick. Extras conclude with the theatrical trailer, audio commentary and deleted scenes. 
Not for the faint-hearted \\u0096 just the thick-headed.\"\n        ],\n        \"semantic_type\": \"\",\n        \"description\": \"\"\n      }\n    },\n    {\n      \"column\": \"label\",\n      \"properties\": {\n        \"dtype\": \"category\",\n        \"num_unique_values\": 2,\n        \"samples\": [\n          \"negative\",\n          \"positive\"\n        ],\n        \"semantic_type\": \"\",\n        \"description\": \"\"\n      }\n    }\n  ]\n}"}},"metadata":{},"execution_count":28}],"source":["df.head(3)"]},{"cell_type":"code","execution_count":29,"id":"43a27caf-779b-4bd1-a3cf-fa641021172e","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"43a27caf-779b-4bd1-a3cf-fa641021172e","executionInfo":{"status":"ok","timestamp":1713843524562,"user_tz":-420,"elapsed":334,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"fd1bd6c8-a340-49a2-deb8-e3a00e217a34"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["array(['positive', 'negative'], dtype=object)"]},"metadata":{},"execution_count":29}],"source":["# Distinct sentiment classes present in the label column.\n","df['label'].unique()"]},{"cell_type":"code","execution_count":30,"id":"ba556f9b-da1c-4d13-8d70-563e0bd528a1","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"ba556f9b-da1c-4d13-8d70-563e0bd528a1","executionInfo":{"status":"ok","timestamp":1713843636003,"user_tz":-420,"elapsed":322,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"85b8ee33-108a-44b9-d395-e372c1b99b79"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["text     0\n","label    0\n","dtype: 
int64"]},"metadata":{},"execution_count":30}],"source":["df.isna().sum()"]},{"cell_type":"markdown","id":"819c31c3-873d-4d31-a21a-759059bd4c6d","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"819c31c3-873d-4d31-a21a-759059bd4c6d"},"source":["### Split the dataset into training and testing sets"]},{"cell_type":"code","execution_count":31,"id":"6ca318a2-26d7-446e-8324-6660171f239d","metadata":{"tags":[],"id":"6ca318a2-26d7-446e-8324-6660171f239d","executionInfo":{"status":"ok","timestamp":1713843687000,"user_tz":-420,"elapsed":1205,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["train_data, test_data, train_labels, test_labels = train_test_split(df['text'], df['label'], test_size=0.3, random_state=42)"]},{"cell_type":"code","execution_count":32,"id":"f0cfc8fc-49e5-4c88-bb33-8084dcf00100","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"f0cfc8fc-49e5-4c88-bb33-8084dcf00100","executionInfo":{"status":"ok","timestamp":1713843694590,"user_tz":-420,"elapsed":329,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"767e8a04-ed3d-466f-a935-15eab7cdb83f"},"outputs":[{"output_type":"stream","name":"stdout","text":["38094    As much as I love trains, I couldn't stomach t...\n","40624    This was a very good PPV, but like Wrestlemani...\n","49425    Not finding the right words is everybody's pro...\n","35734    I'm really suprised this movie didn't get a hi...\n","41708    I'll start by confessing that I tend to really...\n","                               ...                        \n","11284    `Shadow Magic' recaptures the joy and amazemen...\n","44732    I found this movie to be quite enjoyable and f...\n","38158    Avoid this one! It is a terrible movie. So wha...\n","860      This production was quite a surprise for me. I...\n","15795    This is a decent movie. 
Although little bit sh...\n","Name: text, Length: 35000, dtype: object\n"]}],"source":["print(train_data)"]},{"cell_type":"code","execution_count":33,"id":"51d0a415-4982-43dd-8864-c189ba6826f4","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"51d0a415-4982-43dd-8864-c189ba6826f4","executionInfo":{"status":"ok","timestamp":1713843697940,"user_tz":-420,"elapsed":311,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"8167d4df-179d-4cf9-bf14-9112184e98be"},"outputs":[{"output_type":"stream","name":"stdout","text":["38094    negative\n","40624    positive\n","49425    negative\n","35734    positive\n","41708    negative\n","           ...   \n","11284    positive\n","44732    positive\n","38158    negative\n","860      positive\n","15795    positive\n","Name: label, Length: 35000, dtype: object\n"]}],"source":["print(train_labels)"]},{"cell_type":"markdown","id":"42987cdb-4cdf-46df-95d8-7c2b2824c1ee","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"42987cdb-4cdf-46df-95d8-7c2b2824c1ee"},"source":["### Create a pipeline"]},{"cell_type":"code","execution_count":34,"id":"06ffd548-c333-4c1a-87ce-9699ddd116ee","metadata":{"tags":[],"id":"06ffd548-c333-4c1a-87ce-9699ddd116ee","executionInfo":{"status":"ok","timestamp":1713843715911,"user_tz":-420,"elapsed":333,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["sentiment_pipeline = Pipeline([\n","    ('tfidf', TfidfVectorizer()),\n","    ('nb', MultinomialNB())\n","])"]},{"cell_type":"markdown","id":"6bafa7cd-8d0b-4725-bd40-4a3b04634fab","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"6bafa7cd-8d0b-4725-bd40-4a3b04634fab"},"source":["### Train the model using the 
pipeline"]},{"cell_type":"code","execution_count":35,"id":"712dea09-52c2-4a9f-8bf9-3cbb273fe4b5","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/","height":126},"id":"712dea09-52c2-4a9f-8bf9-3cbb273fe4b5","executionInfo":{"status":"ok","timestamp":1713844075138,"user_tz":-420,"elapsed":9437,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"fda94af1-772d-4175-ee65-ab856819dea7"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["Pipeline(steps=[('tfidf', TfidfVectorizer()), ('nb', MultinomialNB())])"],"text/html":["<style>#sk-container-id-1 {color: black;background-color: white;}#sk-container-id-1 pre{padding: 0;}#sk-container-id-1 div.sk-toggleable {background-color: white;}#sk-container-id-1 label.sk-toggleable__label {cursor: pointer;display: block;width: 100%;margin-bottom: 0;padding: 0.3em;box-sizing: border-box;text-align: center;}#sk-container-id-1 label.sk-toggleable__label-arrow:before {content: \"▸\";float: left;margin-right: 0.25em;color: #696969;}#sk-container-id-1 label.sk-toggleable__label-arrow:hover:before {color: black;}#sk-container-id-1 div.sk-estimator:hover label.sk-toggleable__label-arrow:before {color: black;}#sk-container-id-1 div.sk-toggleable__content {max-height: 0;max-width: 0;overflow: hidden;text-align: left;background-color: #f0f8ff;}#sk-container-id-1 div.sk-toggleable__content pre {margin: 0.2em;color: black;border-radius: 0.25em;background-color: #f0f8ff;}#sk-container-id-1 input.sk-toggleable__control:checked~div.sk-toggleable__content {max-height: 200px;max-width: 100%;overflow: auto;}#sk-container-id-1 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {content: \"▾\";}#sk-container-id-1 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-1 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: 
#d4ebff;}#sk-container-id-1 input.sk-hidden--visually {border: 0;clip: rect(1px 1px 1px 1px);clip: rect(1px, 1px, 1px, 1px);height: 1px;margin: -1px;overflow: hidden;padding: 0;position: absolute;width: 1px;}#sk-container-id-1 div.sk-estimator {font-family: monospace;background-color: #f0f8ff;border: 1px dotted black;border-radius: 0.25em;box-sizing: border-box;margin-bottom: 0.5em;}#sk-container-id-1 div.sk-estimator:hover {background-color: #d4ebff;}#sk-container-id-1 div.sk-parallel-item::after {content: \"\";width: 100%;border-bottom: 1px solid gray;flex-grow: 1;}#sk-container-id-1 div.sk-label:hover label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-1 div.sk-serial::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: 0;}#sk-container-id-1 div.sk-serial {display: flex;flex-direction: column;align-items: center;background-color: white;padding-right: 0.2em;padding-left: 0.2em;position: relative;}#sk-container-id-1 div.sk-item {position: relative;z-index: 1;}#sk-container-id-1 div.sk-parallel {display: flex;align-items: stretch;justify-content: center;background-color: white;position: relative;}#sk-container-id-1 div.sk-item::before, #sk-container-id-1 div.sk-parallel-item::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: -1;}#sk-container-id-1 div.sk-parallel-item {display: flex;flex-direction: column;z-index: 1;position: relative;background-color: white;}#sk-container-id-1 div.sk-parallel-item:first-child::after {align-self: flex-end;width: 50%;}#sk-container-id-1 div.sk-parallel-item:last-child::after {align-self: flex-start;width: 50%;}#sk-container-id-1 div.sk-parallel-item:only-child::after {width: 0;}#sk-container-id-1 div.sk-dashed-wrapped {border: 1px dashed gray;margin: 0 0.4em 0.5em 0.4em;box-sizing: border-box;padding-bottom: 0.4em;background-color: white;}#sk-container-id-1 
div.sk-label label {font-family: monospace;font-weight: bold;display: inline-block;line-height: 1.2em;}#sk-container-id-1 div.sk-label-container {text-align: center;}#sk-container-id-1 div.sk-container {/* jupyter's `normalize.less` sets `[hidden] { display: none; }` but bootstrap.min.css set `[hidden] { display: none !important; }` so we also need the `!important` here to be able to override the default hidden behavior on the sphinx rendered scikit-learn.org. See: https://github.com/scikit-learn/scikit-learn/issues/21755 */display: inline-block !important;position: relative;}#sk-container-id-1 div.sk-text-repr-fallback {display: none;}</style><div id=\"sk-container-id-1\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>Pipeline(steps=[(&#x27;tfidf&#x27;, TfidfVectorizer()), (&#x27;nb&#x27;, MultinomialNB())])</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. <br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item sk-dashed-wrapped\"><div class=\"sk-label-container\"><div class=\"sk-label sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-1\" type=\"checkbox\" ><label for=\"sk-estimator-id-1\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">Pipeline</label><div class=\"sk-toggleable__content\"><pre>Pipeline(steps=[(&#x27;tfidf&#x27;, TfidfVectorizer()), (&#x27;nb&#x27;, MultinomialNB())])</pre></div></div></div><div class=\"sk-serial\"><div class=\"sk-item\"><div class=\"sk-estimator sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-2\" type=\"checkbox\" ><label for=\"sk-estimator-id-2\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">TfidfVectorizer</label><div class=\"sk-toggleable__content\"><pre>TfidfVectorizer()</pre></div></div></div><div 
class=\"sk-item\"><div class=\"sk-estimator sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-3\" type=\"checkbox\" ><label for=\"sk-estimator-id-3\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">MultinomialNB</label><div class=\"sk-toggleable__content\"><pre>MultinomialNB()</pre></div></div></div></div></div></div></div>"]},"metadata":{},"execution_count":35}],"source":["sentiment_pipeline.fit(train_data, train_labels)\n"]},{"cell_type":"markdown","id":"4c95c599-ae0d-433f-9ed5-856fd9fa35e0","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"4c95c599-ae0d-433f-9ed5-856fd9fa35e0"},"source":["### Make predictions on the test set"]},{"cell_type":"code","execution_count":36,"id":"37ae9eda-4a02-4f40-bdeb-ecb8ea67f9d3","metadata":{"tags":[],"id":"37ae9eda-4a02-4f40-bdeb-ecb8ea67f9d3","executionInfo":{"status":"ok","timestamp":1713844081489,"user_tz":-420,"elapsed":3301,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["predictions = sentiment_pipeline.predict(test_data)"]},{"cell_type":"code","source":["test_data[1]"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":109},"id":"a620DunmGUpx","executionInfo":{"status":"ok","timestamp":1713844697926,"user_tz":-420,"elapsed":4,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"6109017f-a264-46b9-cd2a-db7d91158ba0"},"id":"a620DunmGUpx","execution_count":43,"outputs":[{"output_type":"execute_result","data":{"text/plain":["'A wonderful little production. <br /><br />The filming technique is very unassuming- very old-time-BBC fashion and gives a comforting, and sometimes discomforting, sense of realism to the entire piece. <br /><br />The actors are extremely well chosen- Michael Sheen not only \"has got all the polari\" but he has all the voices down pat too! 
You can truly see the seamless editing guided by the references to Williams\\' diary entries, not only is it well worth the watching but it is a terrificly written and performed piece. A masterful production about one of the great master\\'s of comedy and his life. <br /><br />The realism really comes home with the little things: the fantasy of the guard which, rather than use the traditional \\'dream\\' techniques remains solid then disappears. It plays on our knowledge and our senses, particularly with the scenes concerning Orton and Halliwell and the sets (particularly of their flat with Halliwell\\'s murals decorating every surface) are terribly well done.'"],"application/vnd.google.colaboratory.intrinsic+json":{"type":"string"}},"metadata":{},"execution_count":43}]},{"cell_type":"code","source":["test_labels[1]"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":36},"id":"qmW5xhMgGae6","executionInfo":{"status":"ok","timestamp":1713844689037,"user_tz":-420,"elapsed":4,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"2f9176d6-62cc-454b-cf06-292c2682f59f"},"id":"qmW5xhMgGae6","execution_count":41,"outputs":[{"output_type":"execute_result","data":{"text/plain":["'positive'"],"application/vnd.google.colaboratory.intrinsic+json":{"type":"string"}},"metadata":{},"execution_count":41}]},{"cell_type":"code","source":["predictions"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"9p7uhKVvEXQn","executionInfo":{"status":"ok","timestamp":1713844095757,"user_tz":-420,"elapsed":312,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"310851b4-6a8e-4308-f477-a932a640c26c"},"id":"9p7uhKVvEXQn","execution_count":37,"outputs":[{"output_type":"execute_result","data":{"text/plain":["array(['negative', 'positive', 'negative', ..., 'negative', 'positive',\n","       'positive'], 
dtype='<U8')"]},"metadata":{},"execution_count":37}]},{"cell_type":"markdown","id":"a33458e2-90cb-4c94-b977-8cc8ea5a273e","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"a33458e2-90cb-4c94-b977-8cc8ea5a273e"},"source":["### Evaluate the model"]},{"cell_type":"code","source":["test_data.shape"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"XDecs57CGtrY","executionInfo":{"status":"ok","timestamp":1713844728124,"user_tz":-420,"elapsed":387,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"2e38875f-dc30-455f-ec6c-4a66024c76ba"},"id":"XDecs57CGtrY","execution_count":44,"outputs":[{"output_type":"execute_result","data":{"text/plain":["(15000,)"]},"metadata":{},"execution_count":44}]},{"cell_type":"code","source":["test_labels.shape"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"KfDAFQETG1b-","executionInfo":{"status":"ok","timestamp":1713844744202,"user_tz":-420,"elapsed":2,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"245bf06a-0b44-4466-ba0f-c4fde614c1cc"},"id":"KfDAFQETG1b-","execution_count":45,"outputs":[{"output_type":"execute_result","data":{"text/plain":["(15000,)"]},"metadata":{},"execution_count":45}]},{"cell_type":"code","execution_count":46,"id":"9ad90567-93d2-4090-81be-5c77f41e379a","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"9ad90567-93d2-4090-81be-5c77f41e379a","executionInfo":{"status":"ok","timestamp":1713844759769,"user_tz":-420,"elapsed":831,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"f7aad793-8a18-4799-85f4-11d3b5df0955"},"outputs":[{"output_type":"stream","name":"stdout","text":["Classification Report:\n","               precision    recall  f1-score   support\n","\n","    negative       0.84      0.89      0.86      7411\n","    positive       0.89      0.83      0.86      7589\n","\n","    accuracy                           0.86     15000\n","   
macro avg       0.86      0.86      0.86     15000\n","weighted avg       0.86      0.86      0.86     15000\n","\n"]}],"source":["\n","report = classification_report(test_labels, predictions)\n","\n","print(\"Classification Report:\\n\", report)"]},{"cell_type":"code","execution_count":47,"id":"ef002e29-d065-4825-a076-3d23fdfa7b59","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"ef002e29-d065-4825-a076-3d23fdfa7b59","executionInfo":{"status":"ok","timestamp":1713844776999,"user_tz":-420,"elapsed":331,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"8ebfdcdc-b29a-4e50-a8c1-c32256472966"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["array([[6620,  791],\n","       [1296, 6293]])"]},"metadata":{},"execution_count":47}],"source":["cm = confusion_matrix(test_labels, predictions)\n","cm"]},{"cell_type":"markdown","id":"6e7729bb-a833-4feb-bd2a-b04a2741bd70","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"6e7729bb-a833-4feb-bd2a-b04a2741bd70"},"source":["## Huggingface: Pre-trained sentiment analysis 
model\n","\n","https://huggingface.co/distilbert-base-uncased-finetuned-sst-2-english"]},{"cell_type":"code","execution_count":48,"id":"9afad444-c2cc-4f3d-b49d-07a723be6154","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/","height":291,"referenced_widgets":["6b743d09e2a24a54a0302a0aee69cc90","764f39f3c28841ba9d96fcda0daa750f","dfef59134fb040c99e9d5e2d22704629","2d753be068804858bd6a158932e8be07","c62ddd64f9c84a8f958b59c7eb3907fe","32d4d98140914c6c97bbd3b18902cef3","ab486ae08df34e688cb514a0f1ff17e8","9e094454e05f432fac232399c525c820","1fad54a4f83147eaac49f8bfd07786be","4e5b866634e342119e8c17b299c494d3","868625142e274217806ae6793e7bba1e","57fdcbfad44045d9926eb6be9b0e98e4","6f76b70971734347af420200eb4e7961","227592f3c9ce45ed980e06711e16da32","553d95aeca14426ea0cfe1658c670929","20e75f776514473b917f07a1f948bbee","21752585844c4b0a9d3e9be9a91e08ec","92823464dc54474cbff9219bfd4d7e85","0955564b996f4ce296532505fcf7b2b5","dcabc828dbe04b73ac7667ed57cddba4","5778deb87339492886307c0a27e48941","935ade78484944fc9fc3822b86629ae7","a7d41b7b84854d81aa4fd154e4cd95cf","c038edf8e1b246b0956232182e5aa083","3b8487f5e7cb4ba5b13173f5afa41743","19dbb9ba4aa6461da50f7c27dae38194","014878ccbd574925a16453332f50b006","e09f5c2db82d4a8f85522a4da34b8e39","2ef82c50224f492aa999726610a399a1","32d1750a89c24d2f8adc77795355fee8","5bcc77b7a6d34a0dae6d00278d221d5e","d83e05f8c52445edbe640678b8961dd4","502fd49e91d94d6f8a35b5d755d74af1","9a6820b62ba24698b607aa592c2569f4","e57391fa7a9449d18de6d6cdb2fb8b22","27869bcaf68344d3b051270dbbfd2f14","045cdec112a4421b8867cdc0f3c51312","d7f66508bf454fcdbe3b86049b3b07dd","92b7a96a86bb4354b9201b5a6c797464","bb6c8ec2753c4a13ac5d830b27a5b086","18d0ecc027564d52a35ac3de71e14e5d","35dfe7bbe8334855b42a555400fa2bac","28671e25f8c94f539252c2ee0c4423ac","5b9ec995dc9842f181644d1b02806333"]},"id":"9afad444-c2cc-4f3d-b49d-07a723be6154","executionInfo":{"status":"ok","timestamp":1713844938786,"user_tz":-420,"elapsed":18112,"user":{"displayName":"wannisa 
paethong","userId":"05174644342145313126"}},"outputId":"06e47173-f131-45c9-8383-73b169407e74"},"outputs":[{"output_type":"stream","name":"stderr","text":["/usr/local/lib/python3.10/dist-packages/huggingface_hub/utils/_token.py:88: UserWarning: \n","The secret `HF_TOKEN` does not exist in your Colab secrets.\n","To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n","You will be able to reuse this secret in all of your notebooks.\n","Please note that authentication is recommended but still optional to access public models or datasets.\n","  warnings.warn(\n"]},{"output_type":"display_data","data":{"text/plain":["config.json:   0%|          | 0.00/629 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"6b743d09e2a24a54a0302a0aee69cc90"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["model.safetensors:   0%|          | 0.00/268M [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"57fdcbfad44045d9926eb6be9b0e98e4"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["tokenizer_config.json:   0%|          | 0.00/48.0 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"a7d41b7b84854d81aa4fd154e4cd95cf"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["vocab.txt:   0%|          | 0.00/232k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"9a6820b62ba24698b607aa592c2569f4"}},"metadata":{}},{"output_type":"execute_result","data":{"text/plain":["[{'label': 'POSITIVE', 'score': 0.9998656511306763},\n"," {'label': 'NEGATIVE', 'score': 0.9991129040718079}]"]},"metadata":{},"execution_count":48}],"source":["\n","from transformers import 
pipeline\n","sentiment_analyzer = pipeline('sentiment-analysis', model =\"distilbert-base-uncased-finetuned-sst-2-english\") #, revision =\"af0f99b\")\n","data = [\"I love you\", \"I hate you\"]\n","sentiment_analyzer(data)\n"]},{"cell_type":"code","execution_count":49,"id":"4987efd9-8ca8-40b1-90cc-ff361207fb8f","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"4987efd9-8ca8-40b1-90cc-ff361207fb8f","executionInfo":{"status":"ok","timestamp":1713844974003,"user_tz":-420,"elapsed":327,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"4e317a6e-3b89-4218-e33a-cbcbe6773ad4"},"outputs":[{"output_type":"stream","name":"stdout","text":["[{'label': 'POSITIVE', 'score': 0.9996837377548218}]\n"]}],"source":["result = sentiment_analyzer(\"I love using this model!\")\n","print(result)"]},{"cell_type":"markdown","id":"68436dda-e3c3-499d-b390-60443f9a1796","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"68436dda-e3c3-499d-b390-60443f9a1796"},"source":["## Huggingface: Thai"]},{"cell_type":"markdown","id":"72a9f8e0-12bf-403b-8b78-e381a65e9eaa","metadata":{"id":"72a9f8e0-12bf-403b-8b78-e381a65e9eaa"},"source":["### 
model=\"poom-sci/WangchanBERTa-finetuned-sentiment\"\n","\n","https://huggingface.co/poom-sci/WangchanBERTa-finetuned-sentiment"]},{"cell_type":"code","execution_count":50,"id":"d698825b-3bd7-4370-871f-ac6e5fe5fe47","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/","height":245,"referenced_widgets":["a9e58e66a3b74a7a970d39c82240ee3d","d92b56350ecc4599920d9a639d985e48","799faec48b7c4b4a8217a7ae95a3348e","7655233e992f4487a8ffb26b775f203c","6cc7ca687d364b0aa320405368cebfb1","81cf201494024fdb86fb8aba5fec1684","b5eaf04b11284c13b24b5de37760b6ac","18a4efa47c184134b1fb9b1b4192e766","fbd0194ca4044406b2687d56d0006ea7","0d5462301c70484fa0af5f7d7bf5f870","3eb96c9075b04716ae3efeaa84ab027c","e697264388a941b1b296a6ffd94c4955","7619792f1e804121bd210faebd479fec","d7609127cb61448eb0375ad5eaf5a464","9588b4252d554a3caaed831a4da17769","ab426d04502b4114aa5238a0acab1325","39361e3cbf2644cc986b57dafed52e7b","87b90dc01ab545cba91c3313ad61de4e","2b13da36a00343b7929479c35826fe50","38b4787b345e48c3b945b429664f8d3d","079587d2e31546879f8349ade0007505","e9e7c9ca02934159946e6d0d77e6aaa2","eaf3e21d333545a7b6f99f4a3c2dd32d","80a0f41ee58d4dbd9068a2da541e7ab1","d0e4c46296d5466b93ca20a6dedf6ca2","67a23012dc984dcba98c2bbe3345f47c","425bb0a1ca204144a59f5352eae932cb","aef4654647424865bc40844d174666ce","fa71ffe79a5841aa83cbb2712af0d2ed","0dec19543ab842dfaa0c9672da1341ac","c8abf179a9ec4539a1f67a94af1b5ebd","a9b09ef660f04001b1540fbaa8fb8619","14b4c51735484be285cd540a15ea71e4","a9b5ad8768474490a496e527e5434285","a891122437dc425bb13c831efe311e69","4cec9a9f2630431db8a626f2332e8eba","3ab1d042923e426991132a0e4d5d9214","6cef7c9514e74a7d9e0e8ad6a45c2764","20c6909e78f8420d82d7ccd4a3b90600","21db3d4f160f4d6a8d16d56b1f8145c1","af663b93360045a1ac9c5a553895f8dd","e57f85a430494e049cfefb631ca80c4b","dcc24dba7e014f03b6507e4674fdedbd","cbf5367b9a474cd597126f9b44a091a2","edee0ea2881947d88a88e30bbe704227","fbc7838167cd4416b67d23019b6449cc","23bd28ecfee94b879aa9a7242ff5f3a8","951dca5617c147f1ac4e13420dbc8092","
0729c7bad2c54b468c652a3636a3f33a","aa8d847812bd4c3caeb1155f1bbd47e8","af97f90e51054a8d9e7114e131a20a76","8f9db8f97d43461b930600d5f728e630","ad24f48277ce4cb6bdd08829bbbafb7f","22e3e9e7755049a28fc2133b3cad808a","5efc41cf659f4146a01263112f58b43c","77cb395146a545148f7784450c10e4fd","cf00433fc3ff4e46bea7b268cf585ffa","69866f6b67e94c0e87519f1a47dfaf3b","570414a7ae604eef88fc2a2c38637bff","e53c8ef1e9e64c46b28444192c7f6005","05e5df8dd9a94658afbd9968c6a88196","d5de73166aaf41ccbb8795bc0a76cd66","d875b3552444402d80b870192244c726","cf2e96fc2f09426393a7339c1b8882e3","cf7a76769a934ea292595d4d84d19757","3e4c9662eb0a4d6fa372ffd33d0feaff"]},"id":"d698825b-3bd7-4370-871f-ac6e5fe5fe47","executionInfo":{"status":"ok","timestamp":1713844989621,"user_tz":-420,"elapsed":7775,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"662bbdb1-1ea5-411f-b4af-b28a47581779"},"outputs":[{"output_type":"display_data","data":{"text/plain":["config.json:   0%|          | 0.00/965 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"a9e58e66a3b74a7a970d39c82240ee3d"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["pytorch_model.bin:   0%|          | 0.00/421M [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"e697264388a941b1b296a6ffd94c4955"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["tokenizer_config.json:   0%|          | 0.00/491 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"eaf3e21d333545a7b6f99f4a3c2dd32d"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["sentencepiece.bpe.model:   0%|          | 0.00/905k [00:00<?, 
?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"a9b5ad8768474490a496e527e5434285"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["tokenizer.json:   0%|          | 0.00/1.38M [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"edee0ea2881947d88a88e30bbe704227"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["special_tokens_map.json:   0%|          | 0.00/305 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"77cb395146a545148f7784450c10e4fd"}},"metadata":{}},{"output_type":"execute_result","data":{"text/plain":["[{'label': 'pos', 'score': 0.9793058037757874},\n"," {'label': 'neg', 'score': 0.7835226058959961}]"]},"metadata":{},"execution_count":50}],"source":["from transformers import pipeline\n","\n","sentiment_analyzer = pipeline('sentiment-analysis', model=\"poom-sci/WangchanBERTa-finetuned-sentiment\")#, revision=\"b78d071\")\n","\n","data = [\"อร่อยจัดๆ\", \"รอนานแท้\"]\n","sentiment_analyzer(data)\n"]},{"cell_type":"code","execution_count":51,"id":"87d815d4-135c-471e-93ee-cacc93653d4e","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"87d815d4-135c-471e-93ee-cacc93653d4e","executionInfo":{"status":"ok","timestamp":1713844999105,"user_tz":-420,"elapsed":404,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"a9ee94dc-6c6f-4345-f4e8-409c45efc9d3"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["[{'label': 'neg', 'score': 
0.7488928437232971}]"]},"metadata":{},"execution_count":51}],"source":["sentiment_analyzer(\"ข้าวบูด\")"]},{"cell_type":"code","execution_count":null,"id":"60f5c43a-6cb7-47f1-85c5-751e91599ad9","metadata":{"id":"60f5c43a-6cb7-47f1-85c5-751e91599ad9"},"outputs":[],"source":[]},{"cell_type":"markdown","id":"f894a4bd-1f04-4126-aa8d-e0211b41687e","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"f894a4bd-1f04-4126-aa8d-e0211b41687e"},"source":["## Deploy on Streamlit Sharing\n","\n","https://share.streamlit.io/  or https://huggingface.co/spaces\n","\n","https://docs.streamlit.io/library/api-reference\n","\n","https://github.com/\n","\n"]},{"cell_type":"code","execution_count":52,"id":"dfd5baee-dc74-4f6d-84be-52a2b89d0f28","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"dfd5baee-dc74-4f6d-84be-52a2b89d0f28","executionInfo":{"status":"ok","timestamp":1713845688947,"user_tz":-420,"elapsed":361,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"c880bab7-3b44-44cb-dda9-e674a5edf97f"},"outputs":[{"output_type":"stream","name":"stdout","text":["Writing app_senti_65130700309.py\n"]}],"source":["\n","%%writefile app_senti_65130700309.py\n","\n","\n","import streamlit as st\n","from transformers import pipeline\n","\n","# Load the sentiment analysis model\n","model_name = \"poom-sci/WangchanBERTa-finetuned-sentiment\"\n","sentiment_analyzer = pipeline('sentiment-analysis', model=model_name)\n","\n","# Streamlit app\n","st.title(\"Thai Sentiment Analysis App\")\n","\n","# Input text\n","text_input = st.text_area(\"Enter Thai text for sentiment analysis\", \"ขอความเห็นหน่อย... 
\")\n","\n","# Button to trigger analysis\n","if st.button(\"Analyze Sentiment\"):\n","    # Analyze sentiment using the model\n","    results = sentiment_analyzer([text_input])\n","\n","    # Extract sentiment and score\n","    sentiment = results[0]['label']\n","    score = results[0]['score']\n","\n","\n","    # Display result as progress bars\n","    st.subheader(\"Sentiment Analysis Result:\")\n","\n","    if sentiment == 'pos':\n","        st.success(f\"Positive Sentiment (Score: {score:.2f})\")\n","        st.progress(score)\n","    elif sentiment == 'neg':\n","        st.error(f\"Negative Sentiment (Score: {score:.2f})\")\n","        st.progress(score)\n","    else:\n","        st.warning(f\"Neutral Sentiment (Score: {score:.2f})\")\n","        st.progress(score)\n"]},{"cell_type":"code","execution_count":53,"id":"70111967-b904-4f18-a8d0-0c8701ec35ab","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"70111967-b904-4f18-a8d0-0c8701ec35ab","executionInfo":{"status":"ok","timestamp":1713845696482,"user_tz":-420,"elapsed":341,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"4eb475a7-6b7b-44a0-e09b-32150e4d717b"},"outputs":[{"output_type":"stream","name":"stdout","text":["Writing requirements.txt\n"]}],"source":["%%writefile requirements.txt\n","transformers\n","torch\n"]},{"cell_type":"code","execution_count":null,"id":"88001002-587d-403d-ab65-d060bde9d42d","metadata":{"id":"88001002-587d-403d-ab65-d060bde9d42d"},"outputs":[],"source":[]}],"metadata":{"kernelspec":{"display_name":"Python 3 
(ipykernel)","language":"python","name":"python3"},"language_info":{"codemirror_mode":{"name":"ipython","version":3},"file_extension":".py","mimetype":"text/x-python","name":"python","nbconvert_exporter":"python","pygments_lexer":"ipython3","version":"3.11.3"},"colab":{"provenance":[]},"widgets":{"application/vnd.jupyter.widget-state+json":{"6b743d09e2a24a54a0302a0aee69cc90":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_764f39f3c28841ba9d96fcda0daa750f","IPY_MODEL_dfef59134fb040c99e9d5e2d22704629","IPY_MODEL_2d753be068804858bd6a158932e8be07"],"layout":"IPY_MODEL_c62ddd64f9c84a8f958b59c7eb3907fe"}},"764f39f3c28841ba9d96fcda0daa750f":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_32d4d98140914c6c97bbd3b18902cef3","placeholder":"​","style":"IPY_MODEL_ab486ae08df34e688cb514a0f1ff17e8","value":"config.json: 
100%"}},"dfef59134fb040c99e9d5e2d22704629":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_9e094454e05f432fac232399c525c820","max":629,"min":0,"orientation":"horizontal","style":"IPY_MODEL_1fad54a4f83147eaac49f8bfd07786be","value":629}},"2d753be068804858bd6a158932e8be07":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_4e5b866634e342119e8c17b299c494d3","placeholder":"​","style":"IPY_MODEL_868625142e274217806ae6793e7bba1e","value":" 629/629 [00:00&lt;00:00, 
22.0kB/s]"}},"c62ddd64f9c84a8f958b59c7eb3907fe":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"32d4d98140914c6c97bbd3b18902cef3":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"ab486ae08df34e688cb514a0f1ff17e8":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"9e094454e05f432fac232399c525c820":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"1fad54a4f83147eaac49f8bfd07786be":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"4e5b866634e342119e8c17b299c494d3":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"868625142e274217806ae6793e7bba1e":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"57fdcbfad44045d9926eb6be9b0e98e4":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_6f76b70971734347af420200eb4e7961","IPY_MODEL_227592f3c9ce45ed980e06711e16da32","IPY_MODEL_553d95aeca14426ea0cfe1658c670929"],"layout":"IPY_MODEL_20e75f776514473b917f07a1f948bbee"
}},"6f76b70971734347af420200eb4e7961":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_21752585844c4b0a9d3e9be9a91e08ec","placeholder":"​","style":"IPY_MODEL_92823464dc54474cbff9219bfd4d7e85","value":"model.safetensors: 100%"}},"227592f3c9ce45ed980e06711e16da32":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_0955564b996f4ce296532505fcf7b2b5","max":267832558,"min":0,"orientation":"horizontal","style":"IPY_MODEL_dcabc828dbe04b73ac7667ed57cddba4","value":267832558}},"553d95aeca14426ea0cfe1658c670929":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_5778deb87339492886307c0a27e48941","placeholder":"​","style":"IPY_MODEL_935ade78484944fc9fc3822b86629ae7","value":" 268M/268M [00:02&lt;00:00, 
56.5MB/s]"}},"20e75f776514473b917f07a1f948bbee":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"21752585844c4b0a9d3e9be9a91e08ec":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"92823464dc54474cbff9219bfd4d7e85":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"0955564b996f4ce296532505fcf7b2b5":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"dcabc828dbe04b73ac7667ed57cddba4":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"5778deb87339492886307c0a27e48941":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"935ade78484944fc9fc3822b86629ae7":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"a7d41b7b84854d81aa4fd154e4cd95cf":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_c038edf8e1b246b0956232182e5aa083","IPY_MODEL_3b8487f5e7cb4ba5b13173f5afa41743","IPY_MODEL_19dbb9ba4aa6461da50f7c27dae38194"],"layout":"IPY_MODEL_014878ccbd574925a16453332f50b006"
}},"c038edf8e1b246b0956232182e5aa083":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_e09f5c2db82d4a8f85522a4da34b8e39","placeholder":"​","style":"IPY_MODEL_2ef82c50224f492aa999726610a399a1","value":"tokenizer_config.json: 100%"}},"3b8487f5e7cb4ba5b13173f5afa41743":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_32d1750a89c24d2f8adc77795355fee8","max":48,"min":0,"orientation":"horizontal","style":"IPY_MODEL_5bcc77b7a6d34a0dae6d00278d221d5e","value":48}},"19dbb9ba4aa6461da50f7c27dae38194":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_d83e05f8c52445edbe640678b8961dd4","placeholder":"​","style":"IPY_MODEL_502fd49e91d94d6f8a35b5d755d74af1","value":" 48.0/48.0 [00:00&lt;00:00, 
1.73kB/s]"}},"014878ccbd574925a16453332f50b006":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e09f5c2db82d4a8f85522a4da34b8e39":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"2ef82c50224f492aa999726610a399a1":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"32d1750a89c24d2f8adc77795355fee8":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5bcc77b7a6d34a0dae6d00278d221d5e":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"d83e05f8c52445edbe640678b8961dd4":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"502fd49e91d94d6f8a35b5d755d74af1":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"9a6820b62ba24698b607aa592c2569f4":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_e57391fa7a9449d18de6d6cdb2fb8b22","IPY_MODEL_27869bcaf68344d3b051270dbbfd2f14","IPY_MODEL_045cdec112a4421b8867cdc0f3c51312"],"layout":"IPY_MODEL_d7f66508bf454fcdbe3b86049b3b07dd"
}},"e57391fa7a9449d18de6d6cdb2fb8b22":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_92b7a96a86bb4354b9201b5a6c797464","placeholder":"​","style":"IPY_MODEL_bb6c8ec2753c4a13ac5d830b27a5b086","value":"vocab.txt: 100%"}},"27869bcaf68344d3b051270dbbfd2f14":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_18d0ecc027564d52a35ac3de71e14e5d","max":231508,"min":0,"orientation":"horizontal","style":"IPY_MODEL_35dfe7bbe8334855b42a555400fa2bac","value":231508}},"045cdec112a4421b8867cdc0f3c51312":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_28671e25f8c94f539252c2ee0c4423ac","placeholder":"​","style":"IPY_MODEL_5b9ec995dc9842f181644d1b02806333","value":" 232k/232k [00:00&lt;00:00, 
4.50MB/s]"}},"d7f66508bf454fcdbe3b86049b3b07dd":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"92b7a96a86bb4354b9201b5a6c797464":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"bb6c8ec2753c4a13ac5d830b27a5b086":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"18d0ecc027564d52a35ac3de71e14e5d":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"35dfe7bbe8334855b42a555400fa2bac":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"28671e25f8c94f539252c2ee0c4423ac":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5b9ec995dc9842f181644d1b02806333":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"a9e58e66a3b74a7a970d39c82240ee3d":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_d92b56350ecc4599920d9a639d985e48","IPY_MODEL_799faec48b7c4b4a8217a7ae95a3348e","IPY_MODEL_7655233e992f4487a8ffb26b775f203c"],"layout":"IPY_MODEL_6cc7ca687d364b0aa320405368cebfb1"
}},"d92b56350ecc4599920d9a639d985e48":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_81cf201494024fdb86fb8aba5fec1684","placeholder":"​","style":"IPY_MODEL_b5eaf04b11284c13b24b5de37760b6ac","value":"config.json: 100%"}},"799faec48b7c4b4a8217a7ae95a3348e":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_18a4efa47c184134b1fb9b1b4192e766","max":965,"min":0,"orientation":"horizontal","style":"IPY_MODEL_fbd0194ca4044406b2687d56d0006ea7","value":965}},"7655233e992f4487a8ffb26b775f203c":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_0d5462301c70484fa0af5f7d7bf5f870","placeholder":"​","style":"IPY_MODEL_3eb96c9075b04716ae3efeaa84ab027c","value":" 965/965 [00:00&lt;00:00, 
34.6kB/s]"}},"6cc7ca687d364b0aa320405368cebfb1":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"81cf201494024fdb86fb8aba5fec1684":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"b5eaf04b11284c13b24b5de37760b6ac":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"18a4efa47c184134b1fb9b1b4192e766":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"fbd0194ca4044406b2687d56d0006ea7":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"0d5462301c70484fa0af5f7d7bf5f870":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"3eb96c9075b04716ae3efeaa84ab027c":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"e697264388a941b1b296a6ffd94c4955":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_7619792f1e804121bd210faebd479fec","IPY_MODEL_d7609127cb61448eb0375ad5eaf5a464","IPY_MODEL_9588b4252d554a3caaed831a4da17769"],"layout":"IPY_MODEL_ab426d04502b4114aa5238a0acab1325"
}},"7619792f1e804121bd210faebd479fec":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_39361e3cbf2644cc986b57dafed52e7b","placeholder":"​","style":"IPY_MODEL_87b90dc01ab545cba91c3313ad61de4e","value":"pytorch_model.bin: 100%"}},"d7609127cb61448eb0375ad5eaf5a464":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_2b13da36a00343b7929479c35826fe50","max":421072237,"min":0,"orientation":"horizontal","style":"IPY_MODEL_38b4787b345e48c3b945b429664f8d3d","value":421072237}},"9588b4252d554a3caaed831a4da17769":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_079587d2e31546879f8349ade0007505","placeholder":"​","style":"IPY_MODEL_e9e7c9ca02934159946e6d0d77e6aaa2","value":" 421M/421M [00:04&lt;00:00, 
164MB/s]"}},"ab426d04502b4114aa5238a0acab1325":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"39361e3cbf2644cc986b57dafed52e7b":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"o
verflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"87b90dc01ab545cba91c3313ad61de4e":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"2b13da36a00343b7929479c35826fe50":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"38b4787b345e48c3b945b429664f8d3d":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"079587d2e31546879f8349ade0007505":{"model_mo
dule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e9e7c9ca02934159946e6d0d77e6aaa2":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"eaf3e21d333545a7b6f99f4a3c2dd32d":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_80a0f41ee58d4dbd9068a2da541e7ab1","IPY_MODEL_d0e4c46296d5466b93ca20a6dedf6ca2","IPY_MODEL_67a23012dc984dcba98c2bbe3345f47c"],"layout":"IPY_MODEL_425bb0a1ca204144a59f5352eae932cb"}
},"80a0f41ee58d4dbd9068a2da541e7ab1":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_aef4654647424865bc40844d174666ce","placeholder":"​","style":"IPY_MODEL_fa71ffe79a5841aa83cbb2712af0d2ed","value":"tokenizer_config.json: 100%"}},"d0e4c46296d5466b93ca20a6dedf6ca2":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_0dec19543ab842dfaa0c9672da1341ac","max":491,"min":0,"orientation":"horizontal","style":"IPY_MODEL_c8abf179a9ec4539a1f67a94af1b5ebd","value":491}},"67a23012dc984dcba98c2bbe3345f47c":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_a9b09ef660f04001b1540fbaa8fb8619","placeholder":"​","style":"IPY_MODEL_14b4c51735484be285cd540a15ea71e4","value":" 491/491 [00:00&lt;00:00, 
16.6kB/s]"}},"425bb0a1ca204144a59f5352eae932cb":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"aef4654647424865bc40844d174666ce":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"fa71ffe79a5841aa83cbb2712af0d2ed":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"0dec19543ab842dfaa0c9672da1341ac":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"c8abf179a9ec4539a1f67a94af1b5ebd":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"a9b09ef660f04001b1540fbaa8fb8619":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"14b4c51735484be285cd540a15ea71e4":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"a9b5ad8768474490a496e527e5434285":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_a891122437dc425bb13c831efe311e69","IPY_MODEL_4cec9a9f2630431db8a626f2332e8eba","IPY_MODEL_3ab1d042923e426991132a0e4d5d9214"],"layout":"IPY_MODEL_6cef7c9514e74a7d9e0e8ad6a45c2764"
}},"a891122437dc425bb13c831efe311e69":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_20c6909e78f8420d82d7ccd4a3b90600","placeholder":"​","style":"IPY_MODEL_21db3d4f160f4d6a8d16d56b1f8145c1","value":"sentencepiece.bpe.model: 100%"}},"4cec9a9f2630431db8a626f2332e8eba":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_af663b93360045a1ac9c5a553895f8dd","max":904693,"min":0,"orientation":"horizontal","style":"IPY_MODEL_e57f85a430494e049cfefb631ca80c4b","value":904693}},"3ab1d042923e426991132a0e4d5d9214":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_dcc24dba7e014f03b6507e4674fdedbd","placeholder":"​","style":"IPY_MODEL_cbf5367b9a474cd597126f9b44a091a2","value":" 905k/905k [00:00&lt;00:00, 
2.94MB/s]"}},"6cef7c9514e74a7d9e0e8ad6a45c2764":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"20c6909e78f8420d82d7ccd4a3b90600":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"21db3d4f160f4d6a8d16d56b1f8145c1":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"af663b93360045a1ac9c5a553895f8dd":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e57f85a430494e049cfefb631ca80c4b":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"dcc24dba7e014f03b6507e4674fdedbd":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"cbf5367b9a474cd597126f9b44a091a2":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"edee0ea2881947d88a88e30bbe704227":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_fbc7838167cd4416b67d23019b6449cc","IPY_MODEL_23bd28ecfee94b879aa9a7242ff5f3a8","IPY_MODEL_951dca5617c147f1ac4e13420dbc8092"],"layout":"IPY_MODEL_0729c7bad2c54b468c652a3636a3f33a"
}},"fbc7838167cd4416b67d23019b6449cc":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_aa8d847812bd4c3caeb1155f1bbd47e8","placeholder":"​","style":"IPY_MODEL_af97f90e51054a8d9e7114e131a20a76","value":"tokenizer.json: 100%"}},"23bd28ecfee94b879aa9a7242ff5f3a8":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_8f9db8f97d43461b930600d5f728e630","max":1377628,"min":0,"orientation":"horizontal","style":"IPY_MODEL_ad24f48277ce4cb6bdd08829bbbafb7f","value":1377628}},"951dca5617c147f1ac4e13420dbc8092":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_22e3e9e7755049a28fc2133b3cad808a","placeholder":"​","style":"IPY_MODEL_5efc41cf659f4146a01263112f58b43c","value":" 1.38M/1.38M [00:00&lt;00:00, 
31.3MB/s]"}},"0729c7bad2c54b468c652a3636a3f33a":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"aa8d847812bd4c3caeb1155f1bbd47e8":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"af97f90e51054a8d9e7114e131a20a76":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"8f9db8f97d43461b930600d5f728e630":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"ad24f48277ce4cb6bdd08829bbbafb7f":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"22e3e9e7755049a28fc2133b3cad808a":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5efc41cf659f4146a01263112f58b43c":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"77cb395146a545148f7784450c10e4fd":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_cf00433fc3ff4e46bea7b268cf585ffa","IPY_MODEL_69866f6b67e94c0e87519f1a47dfaf3b","IPY_MODEL_570414a7ae604eef88fc2a2c38637bff"],"layout":"IPY_MODEL_e53c8ef1e9e64c46b28444192c7f6005"
}},"cf00433fc3ff4e46bea7b268cf585ffa":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_05e5df8dd9a94658afbd9968c6a88196","placeholder":"​","style":"IPY_MODEL_d5de73166aaf41ccbb8795bc0a76cd66","value":"special_tokens_map.json: 100%"}},"69866f6b67e94c0e87519f1a47dfaf3b":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_d875b3552444402d80b870192244c726","max":305,"min":0,"orientation":"horizontal","style":"IPY_MODEL_cf2e96fc2f09426393a7339c1b8882e3","value":305}},"570414a7ae604eef88fc2a2c38637bff":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_cf7a76769a934ea292595d4d84d19757","placeholder":"​","style":"IPY_MODEL_3e4c9662eb0a4d6fa372ffd33d0feaff","value":" 305/305 [00:00&lt;00:00, 
16.4kB/s]"}},"e53c8ef1e9e64c46b28444192c7f6005":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"05e5df8dd9a94658afbd9968c6a88196":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"d5de73166aaf41ccbb8795bc0a76cd66":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"d875b3552444402d80b870192244c726":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"cf2e96fc2f09426393a7339c1b8882e3":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"cf7a76769a934ea292595d4d84d19757":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"3e4c9662eb0a4d6fa372ffd33d0feaff":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}}}}},"nbformat":4,"nbformat_minor":5}