Spaces:
Sleeping
Sleeping
File size: 158,780 Bytes
14ada6c |
1 |
{"cells":[{"cell_type":"markdown","id":"c454c018-02b7-4c3d-a21f-411748963a3f","metadata":{"id":"c454c018-02b7-4c3d-a21f-411748963a3f"},"source":["# Workshop: Sentiment Analysis"]},{"cell_type":"markdown","id":"2eda2e01-dfc4-42a6-9b6a-5cdf39fbce78","metadata":{"id":"2eda2e01-dfc4-42a6-9b6a-5cdf39fbce78"},"source":["<div>\n","<img src=\"https://lh3.googleusercontent.com/pw/ADCreHdzakFbNdHwBE1ZrwOiNCQibViWOir9DF9Dv4fbZEdWpx4mzFOT_RxkUGLTyDW7fQ0OwEyNQwqllupbvm0WiU0RNuFs-kWx1fTIvjiSkPGE5m64PilOIeApxQLwX_rl-JU7uYT-ROxdppIsJimCeos=w406-h451-s-no-gm?authuser=0\" width=\"390\"/>\n","</div>"]},{"cell_type":"code","source":["ls"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"eBO3zjLr0gY9","executionInfo":{"status":"ok","timestamp":1713839953212,"user_tz":-420,"elapsed":8,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"dc57b433-6f87-4904-99c2-0002d39a7c60"},"id":"eBO3zjLr0gY9","execution_count":1,"outputs":[{"output_type":"stream","name":"stdout","text":["\u001b[0m\u001b[01;34msample_data\u001b[0m/\n"]}]},{"cell_type":"code","source":["from google.colab import drive\n","drive.mount('/content/drive')"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"dXQK7eEb0mGr","executionInfo":{"status":"ok","timestamp":1713840022646,"user_tz":-420,"elapsed":25112,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"93400453-f2a5-4d20-f3bc-f7c03c8abf41"},"id":"dXQK7eEb0mGr","execution_count":2,"outputs":[{"output_type":"stream","name":"stdout","text":["Mounted at /content/drive\n"]}]},{"cell_type":"code","source":["cd \"/content/drive/MyDrive/689-WorkShop/Ass13-SemtimentAna\""],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"eB1rpKAu04zB","executionInfo":{"status":"ok","timestamp":1713840067921,"user_tz":-420,"elapsed":329,"user":{"displayName":"wannisa 
paethong","userId":"05174644342145313126"}},"outputId":"28e5fa28-6dd0-4891-fea8-b363826e9602"},"id":"eB1rpKAu04zB","execution_count":3,"outputs":[{"output_type":"stream","name":"stdout","text":["/content/drive/MyDrive/689-WorkShop/Ass13-SemtimentAna\n"]}]},{"cell_type":"code","source":["ls"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"g8kKS4TJ1CkA","executionInfo":{"status":"ok","timestamp":1713840076790,"user_tz":-420,"elapsed":834,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"cbc24ac9-9c22-4af4-de0e-38d3a0edd796"},"id":"g8kKS4TJ1CkA","execution_count":4,"outputs":[{"output_type":"stream","name":"stdout","text":["imdb_reviews.csv WorkshopSentimentsAna-65130700309.ipynb WorkshopSentimentsAna-std.ipynb\n"]}]},{"cell_type":"code","execution_count":5,"id":"7ef9db65-1fda-4fc6-8bb9-bc52bdbb9529","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"7ef9db65-1fda-4fc6-8bb9-bc52bdbb9529","executionInfo":{"status":"ok","timestamp":1713840098623,"user_tz":-420,"elapsed":14252,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"85c975d0-c099-4fc5-e228-b726da3fca93"},"outputs":[{"output_type":"stream","name":"stdout","text":["Requirement already satisfied: nltk in /usr/local/lib/python3.10/dist-packages (3.8.1)\n","Requirement already satisfied: click in /usr/local/lib/python3.10/dist-packages (from nltk) (8.1.7)\n","Requirement already satisfied: joblib in /usr/local/lib/python3.10/dist-packages (from nltk) (1.4.0)\n","Requirement already satisfied: regex>=2021.8.3 in /usr/local/lib/python3.10/dist-packages (from nltk) (2023.12.25)\n","Requirement already satisfied: tqdm in /usr/local/lib/python3.10/dist-packages (from nltk) (4.66.2)\n","Requirement already satisfied: transformers in /usr/local/lib/python3.10/dist-packages (4.40.0)\n","Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers) 
(3.13.4)\n","Requirement already satisfied: huggingface-hub<1.0,>=0.19.3 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.20.3)\n","Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (1.25.2)\n","Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers) (24.0)\n","Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (6.0.1)\n","Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (2023.12.25)\n","Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers) (2.31.0)\n","Requirement already satisfied: tokenizers<0.20,>=0.19 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.19.1)\n","Requirement already satisfied: safetensors>=0.4.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.4.3)\n","Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers) (4.66.2)\n","Requirement already satisfied: fsspec>=2023.5.0 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.19.3->transformers) (2023.6.0)\n","Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.19.3->transformers) (4.11.0)\n","Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.3.2)\n","Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.7)\n","Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2.0.7)\n","Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) 
(2024.2.2)\n"]}],"source":["!pip install nltk\n","!pip install transformers"]},{"cell_type":"markdown","id":"1a0b8ed9-f240-47b4-aa62-0cf48bdd7868","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"1a0b8ed9-f240-47b4-aa62-0cf48bdd7868"},"source":["## Rule-Based Approaches\n","\n","- **Lexicon-Based Methods**: Use sentiment lexicons or dictionaries that contain words annotated with their sentiment polarity (positive, negative, neutral).\n","- **Pattern Matching**: Identify sentiment based on predefined patterns or rules in the text.\n"]},{"cell_type":"code","execution_count":8,"id":"9f7f14b4-60ba-4a92-a9d0-a124e62fe03b","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"9f7f14b4-60ba-4a92-a9d0-a124e62fe03b","executionInfo":{"status":"ok","timestamp":1713840585023,"user_tz":-420,"elapsed":1966,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"c8ce549c-78f7-47b4-88f2-149744da949d"},"outputs":[{"output_type":"stream","name":"stderr","text":["[nltk_data] Downloading package stopwords to /root/nltk_data...\n","[nltk_data] Unzipping corpora/stopwords.zip.\n","[nltk_data] Downloading package punkt to /root/nltk_data...\n","[nltk_data] Unzipping tokenizers/punkt.zip.\n"]},{"output_type":"execute_result","data":{"text/plain":["True"]},"metadata":{},"execution_count":8}],"source":["import nltk\n","from nltk.tokenize import word_tokenize\n","from nltk.corpus import stopwords\n","\n","nltk.download('stopwords')\n","nltk.download('punkt')"]},{"cell_type":"code","execution_count":9,"id":"8a25f60f-f202-49cd-b965-e3ebb1676786","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"8a25f60f-f202-49cd-b965-e3ebb1676786","executionInfo":{"status":"ok","timestamp":1713840589093,"user_tz":-420,"elapsed":349,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"fa23eaf9-86ce-41c8-de1d-01946a330f2e"},"outputs":[{"output_type":"stream","name":"stdout","text":["['i', 
'me', 'my', 'myself', 'we', 'our', 'ours', 'ourselves', 'you', \"you're\", \"you've\", \"you'll\", \"you'd\", 'your', 'yours', 'yourself', 'yourselves', 'he', 'him', 'his', 'himself', 'she', \"she's\", 'her', 'hers', 'herself', 'it', \"it's\", 'its', 'itself', 'they', 'them', 'their', 'theirs', 'themselves', 'what', 'which', 'who', 'whom', 'this', 'that', \"that'll\", 'these', 'those', 'am', 'is', 'are', 'was', 'were', 'be', 'been', 'being', 'have', 'has', 'had', 'having', 'do', 'does', 'did', 'doing', 'a', 'an', 'the', 'and', 'but', 'if', 'or', 'because', 'as', 'until', 'while', 'of', 'at', 'by', 'for', 'with', 'about', 'against', 'between', 'into', 'through', 'during', 'before', 'after', 'above', 'below', 'to', 'from', 'up', 'down', 'in', 'out', 'on', 'off', 'over', 'under', 'again', 'further', 'then', 'once', 'here', 'there', 'when', 'where', 'why', 'how', 'all', 'any', 'both', 'each', 'few', 'more', 'most', 'other', 'some', 'such', 'no', 'nor', 'not', 'only', 'own', 'same', 'so', 'than', 'too', 'very', 's', 't', 'can', 'will', 'just', 'don', \"don't\", 'should', \"should've\", 'now', 'd', 'll', 'm', 'o', 're', 've', 'y', 'ain', 'aren', \"aren't\", 'couldn', \"couldn't\", 'didn', \"didn't\", 'doesn', \"doesn't\", 'hadn', \"hadn't\", 'hasn', \"hasn't\", 'haven', \"haven't\", 'isn', \"isn't\", 'ma', 'mightn', \"mightn't\", 'mustn', \"mustn't\", 'needn', \"needn't\", 'shan', \"shan't\", 'shouldn', \"shouldn't\", 'wasn', \"wasn't\", 'weren', \"weren't\", 'won', \"won't\", 'wouldn', \"wouldn't\"]\n"]}],"source":["print(stopwords.words('english'))"]},{"cell_type":"code","execution_count":10,"id":"7652d6d2-ba4c-4d02-bfe3-313b6e0f24a5","metadata":{"tags":[],"id":"7652d6d2-ba4c-4d02-bfe3-313b6e0f24a5","executionInfo":{"status":"ok","timestamp":1713841458584,"user_tz":-420,"elapsed":344,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["text = \"I had a good experience with the product. 
Highly recommended!\""]},{"cell_type":"code","execution_count":11,"id":"53fc7d50-59fa-4bec-9ae4-b93a1a3847f1","metadata":{"tags":[],"id":"53fc7d50-59fa-4bec-9ae4-b93a1a3847f1","executionInfo":{"status":"ok","timestamp":1713841468235,"user_tz":-420,"elapsed":318,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["tokens = word_tokenize(text.lower())"]},{"cell_type":"code","execution_count":12,"id":"faac761f-912e-44f7-b7b0-626baaea6a56","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"faac761f-912e-44f7-b7b0-626baaea6a56","executionInfo":{"status":"ok","timestamp":1713841469507,"user_tz":-420,"elapsed":2,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"fe91fd19-88d2-4913-c926-fed1f59089a6"},"outputs":[{"output_type":"stream","name":"stdout","text":["['i', 'had', 'a', 'good', 'experience', 'with', 'the', 'product', '.', 'highly', 'recommended', '!']\n"]}],"source":["print(tokens)"]},{"cell_type":"code","execution_count":13,"id":"9f6543a2-76f4-4993-b535-f90e50bada72","metadata":{"tags":[],"id":"9f6543a2-76f4-4993-b535-f90e50bada72","executionInfo":{"status":"ok","timestamp":1713841471657,"user_tz":-420,"elapsed":1,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["stop_words = set(stopwords.words('english'))"]},{"cell_type":"code","execution_count":14,"id":"4d7f529d-f006-48db-a092-2262f17cb3cd","metadata":{"tags":[],"id":"4d7f529d-f006-48db-a092-2262f17cb3cd","executionInfo":{"status":"ok","timestamp":1713841473288,"user_tz":-420,"elapsed":1,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["tokens = [word for word in tokens if word.isalnum() and word not in stop_words] #alnum = 
alphanumeric"]},{"cell_type":"code","execution_count":15,"id":"4acfb41c-615d-4e8b-92dc-3f73a4188402","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"4acfb41c-615d-4e8b-92dc-3f73a4188402","executionInfo":{"status":"ok","timestamp":1713841476285,"user_tz":-420,"elapsed":352,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"1ae566fc-8dab-41b8-9c8b-db17ec037666"},"outputs":[{"output_type":"stream","name":"stdout","text":["['good', 'experience', 'product', 'highly', 'recommended']\n"]}],"source":["print(tokens)"]},{"cell_type":"code","execution_count":null,"id":"c3cfd1cc-3f30-43de-a469-dec0b3816313","metadata":{"id":"c3cfd1cc-3f30-43de-a469-dec0b3816313"},"outputs":[],"source":[]},{"cell_type":"code","execution_count":16,"id":"aed2ad01-27e5-45e3-a55c-63084966a482","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"aed2ad01-27e5-45e3-a55c-63084966a482","executionInfo":{"status":"ok","timestamp":1713841613192,"user_tz":-420,"elapsed":313,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"1156b9ea-186c-4282-8eb7-b7e6ce0328a3"},"outputs":[{"output_type":"stream","name":"stdout","text":["Sentiment: Positive\n"]}],"source":[
"# Sample positive and negative words\n",
"positive_words = set(['good', 'awesome', 'excellent', 'happy', 'positive'])\n",
"negative_words = set(['bad', 'terrible', 'poor', 'unhappy', 'negative'])\n",
"\n",
"def rule_based_sentiment_analysis(text):\n",
"    \"\"\"Classify `text` as 'Positive', 'Negative' or 'Neutral' from lexicon word counts.\n",
"\n",
"    The text is lower-cased and split with NLTK's `word_tokenize`. Tokens that are\n",
"    not alphanumeric, or that appear in NLTK's English stopword list, are dropped.\n",
"    Every remaining token found in `positive_words` adds 1 to the score and every\n",
"    token found in `negative_words` subtracts 1.\n",
"\n",
"    Args:\n",
"        text (str): Raw text to score.\n",
"\n",
"    Returns:\n",
"        str: 'Positive' if the score is above zero, 'Negative' if it is below\n",
"        zero, otherwise 'Neutral'.\n",
"\n",
"    Note:\n",
"        NLTK's English stopword list contains 'no' and 'not', so negations are\n",
"        removed before scoring: 'not good' is scored exactly like 'good'.\n",
"    \"\"\"\n",
"    # Tokenize the text\n",
"    tokens = word_tokenize(text.lower())\n",
"\n",
"    # Remove stopwords and non-alphanumeric tokens (punctuation such as '.' or '!')\n",
"    stop_words = set(stopwords.words('english'))\n",
"    tokens = [word for word in tokens if word.isalnum() and word not in stop_words]\n",
"\n",
"    # Calculate sentiment score in one pass: +1 per positive word, -1 per negative word\n",
"    sentiment_score = sum((word in positive_words) - (word in negative_words) for word in tokens)\n",
"\n",
"    # Classify sentiment\n",
"    if sentiment_score > 0:\n",
"        return 'Positive'\n",
"    if sentiment_score < 0:\n",
"        return 'Negative'\n",
"    return 'Neutral'\n",
"\n",
"# Example usage\n",
"text_to_analyze = \"I had a good experience with the product. Highly recommended!\"\n",
"sentiment_result = rule_based_sentiment_analysis(text_to_analyze)\n",
"print(f\"Sentiment: {sentiment_result}\")"
]},{"cell_type":"markdown","id":"21764069-0b07-4b3e-8103-b2ab464a9182","metadata":{"tags":[],"id":"21764069-0b07-4b3e-8103-b2ab464a9182"},"source":["## Machine Learning Approaches"]},{"cell_type":"markdown","id":"dc739c8a-a453-43d1-bdc5-ad10d823d748","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"dc739c8a-a453-43d1-bdc5-ad10d823d748"},"source":["### Import packages"]},{"cell_type":"code","execution_count":17,"id":"7e030b97-e111-45ea-b00f-09a360f3400e","metadata":{"tags":[],"id":"7e030b97-e111-45ea-b00f-09a360f3400e","executionInfo":{"status":"ok","timestamp":1713841657541,"user_tz":-420,"elapsed":720,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["import pandas as pd\n","from sklearn.pipeline import Pipeline\n","from sklearn.utils import shuffle\n","from sklearn.model_selection import train_test_split\n","from sklearn.feature_extraction.text import TfidfVectorizer\n","# from sklearn.svm import SVC\n","from sklearn.naive_bayes import MultinomialNB\n","from sklearn.metrics import classification_report, confusion_matrix\n","\n"]},{"cell_type":"markdown","id":"54c4fe66-f52f-487f-bfd5-0ea6e05206ce","metadata":{"tags":[],"id":"54c4fe66-f52f-487f-bfd5-0ea6e05206ce"},"source":["### TF-IDF vectorizer"]},{"cell_type":"markdown","id":"3f5b7e92-5de4-4894-b2be-47dac1cf2482","metadata":{"id":"3f5b7e92-5de4-4894-b2be-47dac1cf2482"},"source":["\n","<div>\n","<img src=\"https://www.kdnuggets.com/wp-content/uploads/awan_convert_text_documents_tfidf_matrix_tfidfvectorizer_3.png\" width=\"590\"/>\n","</div>\n","\n","\n","Image sources: 
https://www.kdnuggets.com/2022/09/convert-text-documents-tfidf-matrix-tfidfvectorizer.html\n","\n","\n","\n","\n"]},{"cell_type":"markdown","id":"9bd125fc-11fd-414a-b8f0-ff7ef628fb94","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"9bd125fc-11fd-414a-b8f0-ff7ef628fb94"},"source":["##### Example on Small data"]},{"cell_type":"code","execution_count":18,"id":"8a61fdce-6544-4774-bc29-265bf4afaa90","metadata":{"tags":[],"id":"8a61fdce-6544-4774-bc29-265bf4afaa90","executionInfo":{"status":"ok","timestamp":1713841845540,"user_tz":-420,"elapsed":360,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["\n","\n","# Sample data\n","documents = [\n"," \"This is the first document.\",\n"," \"This document is the second document.\",\n"," \"And this is the third one.\",\n"," \"Is this the first document?\"\n","]"]},{"cell_type":"code","execution_count":19,"id":"5794027b-2bee-46d9-9b4d-9cbaa7c4120f","metadata":{"tags":[],"id":"5794027b-2bee-46d9-9b4d-9cbaa7c4120f","executionInfo":{"status":"ok","timestamp":1713841849693,"user_tz":-420,"elapsed":471,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["# Create a DataFrame for better visualization\n","df = pd.DataFrame({'Text': documents})"]},{"cell_type":"code","source":["df"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":175},"id":"Wje-T5kT712V","executionInfo":{"status":"ok","timestamp":1713841863619,"user_tz":-420,"elapsed":422,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"96738978-cc1b-4565-f336-173f2a348453"},"id":"Wje-T5kT712V","execution_count":20,"outputs":[{"output_type":"execute_result","data":{"text/plain":[" Text\n","0 This is the first document.\n","1 This document is the second document.\n","2 And this is the third one.\n","3 Is this the first document?"],"text/html":["\n"," <div id=\"df-a66940df-0fc7-4bfe-82ac-69f3b0c52155\" 
class=\"colab-df-container\">\n"," <div>\n","<style scoped>\n"," .dataframe tbody tr th:only-of-type {\n"," vertical-align: middle;\n"," }\n","\n"," .dataframe tbody tr th {\n"," vertical-align: top;\n"," }\n","\n"," .dataframe thead th {\n"," text-align: right;\n"," }\n","</style>\n","<table border=\"1\" class=\"dataframe\">\n"," <thead>\n"," <tr style=\"text-align: right;\">\n"," <th></th>\n"," <th>Text</th>\n"," </tr>\n"," </thead>\n"," <tbody>\n"," <tr>\n"," <th>0</th>\n"," <td>This is the first document.</td>\n"," </tr>\n"," <tr>\n"," <th>1</th>\n"," <td>This document is the second document.</td>\n"," </tr>\n"," <tr>\n"," <th>2</th>\n"," <td>And this is the third one.</td>\n"," </tr>\n"," <tr>\n"," <th>3</th>\n"," <td>Is this the first document?</td>\n"," </tr>\n"," </tbody>\n","</table>\n","</div>\n"," <div class=\"colab-df-buttons\">\n","\n"," <div class=\"colab-df-container\">\n"," <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-a66940df-0fc7-4bfe-82ac-69f3b0c52155')\"\n"," title=\"Convert this dataframe to an interactive table.\"\n"," style=\"display:none;\">\n","\n"," <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\" viewBox=\"0 -960 960 960\">\n"," <path d=\"M120-120v-720h720v720H120Zm60-500h600v-160H180v160Zm220 220h160v-160H400v160Zm0 220h160v-160H400v160ZM180-400h160v-160H180v160Zm440 0h160v-160H620v160ZM180-180h160v-160H180v160Zm440 0h160v-160H620v160Z\"/>\n"," </svg>\n"," </button>\n","\n"," <style>\n"," .colab-df-container {\n"," display:flex;\n"," gap: 12px;\n"," }\n","\n"," .colab-df-convert {\n"," background-color: #E8F0FE;\n"," border: none;\n"," border-radius: 50%;\n"," cursor: pointer;\n"," display: none;\n"," fill: #1967D2;\n"," height: 32px;\n"," padding: 0 0 0 0;\n"," width: 32px;\n"," }\n","\n"," .colab-df-convert:hover {\n"," background-color: #E2EBFA;\n"," box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n"," fill: #174EA6;\n"," }\n","\n"," .colab-df-buttons div {\n"," 
margin-bottom: 4px;\n"," }\n","\n"," [theme=dark] .colab-df-convert {\n"," background-color: #3B4455;\n"," fill: #D2E3FC;\n"," }\n","\n"," [theme=dark] .colab-df-convert:hover {\n"," background-color: #434B5C;\n"," box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n"," filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n"," fill: #FFFFFF;\n"," }\n"," </style>\n","\n"," <script>\n"," const buttonEl =\n"," document.querySelector('#df-a66940df-0fc7-4bfe-82ac-69f3b0c52155 button.colab-df-convert');\n"," buttonEl.style.display =\n"," google.colab.kernel.accessAllowed ? 'block' : 'none';\n","\n"," async function convertToInteractive(key) {\n"," const element = document.querySelector('#df-a66940df-0fc7-4bfe-82ac-69f3b0c52155');\n"," const dataTable =\n"," await google.colab.kernel.invokeFunction('convertToInteractive',\n"," [key], {});\n"," if (!dataTable) return;\n","\n"," const docLinkHtml = 'Like what you see? Visit the ' +\n"," '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n"," + ' to learn more about interactive tables.';\n"," element.innerHTML = '';\n"," dataTable['output_type'] = 'display_data';\n"," await google.colab.output.renderOutput(dataTable, element);\n"," const docLink = document.createElement('div');\n"," docLink.innerHTML = docLinkHtml;\n"," element.appendChild(docLink);\n"," }\n"," </script>\n"," </div>\n","\n","\n","<div id=\"df-a349aca5-128d-48ef-b973-1f625f3c942c\">\n"," <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-a349aca5-128d-48ef-b973-1f625f3c942c')\"\n"," title=\"Suggest charts\"\n"," style=\"display:none;\">\n","\n","<svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n"," width=\"24px\">\n"," <g>\n"," <path d=\"M19 3H5c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V5c0-1.1-.9-2-2-2zM9 17H7v-7h2v7zm4 0h-2V7h2v10zm4 0h-2v-4h2v4z\"/>\n"," </g>\n","</svg>\n"," </button>\n","\n","<style>\n"," .colab-df-quickchart {\n"," --bg-color: 
#E8F0FE;\n"," --fill-color: #1967D2;\n"," --hover-bg-color: #E2EBFA;\n"," --hover-fill-color: #174EA6;\n"," --disabled-fill-color: #AAA;\n"," --disabled-bg-color: #DDD;\n"," }\n","\n"," [theme=dark] .colab-df-quickchart {\n"," --bg-color: #3B4455;\n"," --fill-color: #D2E3FC;\n"," --hover-bg-color: #434B5C;\n"," --hover-fill-color: #FFFFFF;\n"," --disabled-bg-color: #3B4455;\n"," --disabled-fill-color: #666;\n"," }\n","\n"," .colab-df-quickchart {\n"," background-color: var(--bg-color);\n"," border: none;\n"," border-radius: 50%;\n"," cursor: pointer;\n"," display: none;\n"," fill: var(--fill-color);\n"," height: 32px;\n"," padding: 0;\n"," width: 32px;\n"," }\n","\n"," .colab-df-quickchart:hover {\n"," background-color: var(--hover-bg-color);\n"," box-shadow: 0 1px 2px rgba(60, 64, 67, 0.3), 0 1px 3px 1px rgba(60, 64, 67, 0.15);\n"," fill: var(--button-hover-fill-color);\n"," }\n","\n"," .colab-df-quickchart-complete:disabled,\n"," .colab-df-quickchart-complete:disabled:hover {\n"," background-color: var(--disabled-bg-color);\n"," fill: var(--disabled-fill-color);\n"," box-shadow: none;\n"," }\n","\n"," .colab-df-spinner {\n"," border: 2px solid var(--fill-color);\n"," border-color: transparent;\n"," border-bottom-color: var(--fill-color);\n"," animation:\n"," spin 1s steps(1) infinite;\n"," }\n","\n"," @keyframes spin {\n"," 0% {\n"," border-color: transparent;\n"," border-bottom-color: var(--fill-color);\n"," border-left-color: var(--fill-color);\n"," }\n"," 20% {\n"," border-color: transparent;\n"," border-left-color: var(--fill-color);\n"," border-top-color: var(--fill-color);\n"," }\n"," 30% {\n"," border-color: transparent;\n"," border-left-color: var(--fill-color);\n"," border-top-color: var(--fill-color);\n"," border-right-color: var(--fill-color);\n"," }\n"," 40% {\n"," border-color: transparent;\n"," border-right-color: var(--fill-color);\n"," border-top-color: var(--fill-color);\n"," }\n"," 60% {\n"," border-color: transparent;\n"," border-right-color: 
var(--fill-color);\n"," }\n"," 80% {\n"," border-color: transparent;\n"," border-right-color: var(--fill-color);\n"," border-bottom-color: var(--fill-color);\n"," }\n"," 90% {\n"," border-color: transparent;\n"," border-bottom-color: var(--fill-color);\n"," }\n"," }\n","</style>\n","\n"," <script>\n"," async function quickchart(key) {\n"," const quickchartButtonEl =\n"," document.querySelector('#' + key + ' button');\n"," quickchartButtonEl.disabled = true; // To prevent multiple clicks.\n"," quickchartButtonEl.classList.add('colab-df-spinner');\n"," try {\n"," const charts = await google.colab.kernel.invokeFunction(\n"," 'suggestCharts', [key], {});\n"," } catch (error) {\n"," console.error('Error during call to suggestCharts:', error);\n"," }\n"," quickchartButtonEl.classList.remove('colab-df-spinner');\n"," quickchartButtonEl.classList.add('colab-df-quickchart-complete');\n"," }\n"," (() => {\n"," let quickchartButtonEl =\n"," document.querySelector('#df-a349aca5-128d-48ef-b973-1f625f3c942c button');\n"," quickchartButtonEl.style.display =\n"," google.colab.kernel.accessAllowed ? 
'block' : 'none';\n"," })();\n"," </script>\n","</div>\n"," </div>\n"," </div>\n"],"application/vnd.google.colaboratory.intrinsic+json":{"type":"dataframe","variable_name":"df","summary":"{\n \"name\": \"df\",\n \"rows\": 4,\n \"fields\": [\n {\n \"column\": \"Text\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 4,\n \"samples\": [\n \"This document is the second document.\",\n \"Is this the first document?\",\n \"This is the first document.\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}"}},"metadata":{},"execution_count":20}]},{"cell_type":"code","execution_count":21,"id":"b49d5272-0383-4e39-910b-87276c4ffca2","metadata":{"tags":[],"id":"b49d5272-0383-4e39-910b-87276c4ffca2","executionInfo":{"status":"ok","timestamp":1713841867905,"user_tz":-420,"elapsed":2,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["# TF-IDF vectorization\n","vectorizer = TfidfVectorizer()\n","tfidf_matrix = vectorizer.fit_transform(df['Text'].tolist())"]},{"cell_type":"code","execution_count":22,"id":"46c0b47d-80ab-498b-91a2-7202f1c429fd","metadata":{"tags":[],"id":"46c0b47d-80ab-498b-91a2-7202f1c429fd","executionInfo":{"status":"ok","timestamp":1713841872560,"user_tz":-420,"elapsed":320,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["# Convert the TF-IDF matrix to a DataFrame\n","tfidf_df = pd.DataFrame(tfidf_matrix.toarray(), columns=vectorizer.get_feature_names_out())"]},{"cell_type":"code","execution_count":23,"id":"91c2bee0-5bb6-44b9-a609-1f3d0e891ad4","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"91c2bee0-5bb6-44b9-a609-1f3d0e891ad4","executionInfo":{"status":"ok","timestamp":1713841877895,"user_tz":-420,"elapsed":339,"user":{"displayName":"wannisa 
paethong","userId":"05174644342145313126"}},"outputId":"cdd8422d-bf3a-42c1-a476-2b15d7f37157"},"outputs":[{"output_type":"stream","name":"stdout","text":["Original Data:\n"," Text\n","0 This is the first document.\n","1 This document is the second document.\n","2 And this is the third one.\n","3 Is this the first document?\n"]}],"source":["# Print the original data\n","print(\"Original Data:\")\n","print(df)"]},{"cell_type":"code","execution_count":24,"id":"24c4a522-8ef4-4001-ada6-031a043b9a54","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"24c4a522-8ef4-4001-ada6-031a043b9a54","executionInfo":{"status":"ok","timestamp":1713841882847,"user_tz":-420,"elapsed":344,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"2606fbf1-fe41-4e03-899b-5d3f2776685f"},"outputs":[{"output_type":"stream","name":"stdout","text":[" (0, 1)\t0.46979138557992045\n"," (0, 2)\t0.5802858236844359\n"," (0, 6)\t0.38408524091481483\n"," (0, 3)\t0.38408524091481483\n"," (0, 8)\t0.38408524091481483\n"," (1, 5)\t0.5386476208856763\n"," (1, 1)\t0.6876235979836938\n"," (1, 6)\t0.281088674033753\n"," (1, 3)\t0.281088674033753\n"," (1, 8)\t0.281088674033753\n"," (2, 4)\t0.511848512707169\n"," (2, 7)\t0.511848512707169\n"," (2, 0)\t0.511848512707169\n"," (2, 6)\t0.267103787642168\n"," (2, 3)\t0.267103787642168\n"," (2, 8)\t0.267103787642168\n"," (3, 1)\t0.46979138557992045\n"," (3, 2)\t0.5802858236844359\n"," (3, 6)\t0.38408524091481483\n"," (3, 3)\t0.38408524091481483\n"," (3, 8)\t0.38408524091481483\n"]}],"source":["print(tfidf_matrix)"]},{"cell_type":"code","execution_count":25,"id":"6feb5892-284f-43d1-ab7b-5b13dbfadd0b","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"6feb5892-284f-43d1-ab7b-5b13dbfadd0b","executionInfo":{"status":"ok","timestamp":1713841924141,"user_tz":-420,"elapsed":341,"user":{"displayName":"wannisa 
paethong","userId":"05174644342145313126"}},"outputId":"0df619c6-eb05-43a0-da9d-7c0d3c0326b7"},"outputs":[{"output_type":"stream","name":"stdout","text":["\n","TF-IDF Matrix:\n"," and document first is one second the \\\n","0 0.000000 0.469791 0.580286 0.384085 0.000000 0.000000 0.384085 \n","1 0.000000 0.687624 0.000000 0.281089 0.000000 0.538648 0.281089 \n","2 0.511849 0.000000 0.000000 0.267104 0.511849 0.000000 0.267104 \n","3 0.000000 0.469791 0.580286 0.384085 0.000000 0.000000 0.384085 \n","\n"," third this \n","0 0.000000 0.384085 \n","1 0.000000 0.281089 \n","2 0.511849 0.267104 \n","3 0.000000 0.384085 \n"]}],"source":["# Print the TF-IDF matrix\n","print(\"\\nTF-IDF Matrix:\")\n","print(tfidf_df)"]},{"cell_type":"markdown","id":"6802c239-edfa-462e-99ea-31386fd7aed4","metadata":{"tags":[],"id":"6802c239-edfa-462e-99ea-31386fd7aed4"},"source":["## Naive Bayes classifier trained on the TF-IDF features."]},{"cell_type":"markdown","id":"3accf6f8-6cae-4265-8d5d-fb5d40a07a2d","metadata":{"id":"3accf6f8-6cae-4265-8d5d-fb5d40a07a2d"},"source":["<div>\n","<img src=\"https://lh3.googleusercontent.com/pw/AP1GczOBxYJIFFWIiKJfFMdSp10-P1FNc6fZx7Wxa2NKpgw36p0Lady_mBMgxnKXS4cRbHwH2rnItp3cjvgIYdAN_LDcLlEzf1-8AJ62ybBOEGe8QKyH-CAojll13TKEDAo3yxwKvDh7wJRv2Rf1u7wWTjDI=w1911-h485-s-no-gm?authuser=0\" width=\"800\"/>\n","</div>\n"]},{"cell_type":"markdown","id":"9062063a-557b-4971-ad84-e3601b1a520e","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"9062063a-557b-4971-ad84-e3601b1a520e"},"source":["### Read data/Preparation"]},{"cell_type":"code","execution_count":26,"id":"8d2eab09-03c7-441e-9c78-0c2e069f4d25","metadata":{"tags":[],"id":"8d2eab09-03c7-441e-9c78-0c2e069f4d25","executionInfo":{"status":"ok","timestamp":1713843412522,"user_tz":-420,"elapsed":3570,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["# df = pd.read_csv(\"Womens_Clothing_E_Commerce_Reviews.csv\")\n","df = 
pd.read_csv(\"imdb_reviews.csv\")"]},{"cell_type":"code","execution_count":27,"id":"aca597f3-c8da-4314-990e-253d5ed719da","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"aca597f3-c8da-4314-990e-253d5ed719da","executionInfo":{"status":"ok","timestamp":1713843417599,"user_tz":-420,"elapsed":381,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"1bc779d8-5cb6-4263-cfde-29f2a9ce6e82"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["(50000, 2)"]},"metadata":{},"execution_count":27}],"source":["df.shape"]},{"cell_type":"code","execution_count":28,"id":"7d8131e4-4a69-45af-aa12-335c926e308f","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/","height":143},"id":"7d8131e4-4a69-45af-aa12-335c926e308f","executionInfo":{"status":"ok","timestamp":1713843430104,"user_tz":-420,"elapsed":994,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"03ebe55c-6c56-4084-cf22-0d4c48626788"},"outputs":[{"output_type":"execute_result","data":{"text/plain":[" text label\n","0 One of the other reviewers has mentioned that ... positive\n","1 A wonderful little production. <br /><br />The... positive\n","2 I thought this was a wonderful way to spend ti... 
positive"],"text/html":["\n"," <div id=\"df-ea50fdb4-e951-4e4b-be83-2b339db320c3\" class=\"colab-df-container\">\n"," <div>\n","<style scoped>\n"," .dataframe tbody tr th:only-of-type {\n"," vertical-align: middle;\n"," }\n","\n"," .dataframe tbody tr th {\n"," vertical-align: top;\n"," }\n","\n"," .dataframe thead th {\n"," text-align: right;\n"," }\n","</style>\n","<table border=\"1\" class=\"dataframe\">\n"," <thead>\n"," <tr style=\"text-align: right;\">\n"," <th></th>\n"," <th>text</th>\n"," <th>label</th>\n"," </tr>\n"," </thead>\n"," <tbody>\n"," <tr>\n"," <th>0</th>\n"," <td>One of the other reviewers has mentioned that ...</td>\n"," <td>positive</td>\n"," </tr>\n"," <tr>\n"," <th>1</th>\n"," <td>A wonderful little production. <br /><br />The...</td>\n"," <td>positive</td>\n"," </tr>\n"," <tr>\n"," <th>2</th>\n"," <td>I thought this was a wonderful way to spend ti...</td>\n"," <td>positive</td>\n"," </tr>\n"," </tbody>\n","</table>\n","</div>\n"," <div class=\"colab-df-buttons\">\n","\n"," <div class=\"colab-df-container\">\n"," <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-ea50fdb4-e951-4e4b-be83-2b339db320c3')\"\n"," title=\"Convert this dataframe to an interactive table.\"\n"," style=\"display:none;\">\n","\n"," <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\" viewBox=\"0 -960 960 960\">\n"," <path d=\"M120-120v-720h720v720H120Zm60-500h600v-160H180v160Zm220 220h160v-160H400v160Zm0 220h160v-160H400v160ZM180-400h160v-160H180v160Zm440 0h160v-160H620v160ZM180-180h160v-160H180v160Zm440 0h160v-160H620v160Z\"/>\n"," </svg>\n"," </button>\n","\n"," <style>\n"," .colab-df-container {\n"," display:flex;\n"," gap: 12px;\n"," }\n","\n"," .colab-df-convert {\n"," background-color: #E8F0FE;\n"," border: none;\n"," border-radius: 50%;\n"," cursor: pointer;\n"," display: none;\n"," fill: #1967D2;\n"," height: 32px;\n"," padding: 0 0 0 0;\n"," width: 32px;\n"," }\n","\n"," .colab-df-convert:hover {\n"," background-color: #E2EBFA;\n"," 
box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n"," fill: #174EA6;\n"," }\n","\n"," .colab-df-buttons div {\n"," margin-bottom: 4px;\n"," }\n","\n"," [theme=dark] .colab-df-convert {\n"," background-color: #3B4455;\n"," fill: #D2E3FC;\n"," }\n","\n"," [theme=dark] .colab-df-convert:hover {\n"," background-color: #434B5C;\n"," box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n"," filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n"," fill: #FFFFFF;\n"," }\n"," </style>\n","\n"," <script>\n"," const buttonEl =\n"," document.querySelector('#df-ea50fdb4-e951-4e4b-be83-2b339db320c3 button.colab-df-convert');\n"," buttonEl.style.display =\n"," google.colab.kernel.accessAllowed ? 'block' : 'none';\n","\n"," async function convertToInteractive(key) {\n"," const element = document.querySelector('#df-ea50fdb4-e951-4e4b-be83-2b339db320c3');\n"," const dataTable =\n"," await google.colab.kernel.invokeFunction('convertToInteractive',\n"," [key], {});\n"," if (!dataTable) return;\n","\n"," const docLinkHtml = 'Like what you see? 
Visit the ' +\n"," '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n"," + ' to learn more about interactive tables.';\n"," element.innerHTML = '';\n"," dataTable['output_type'] = 'display_data';\n"," await google.colab.output.renderOutput(dataTable, element);\n"," const docLink = document.createElement('div');\n"," docLink.innerHTML = docLinkHtml;\n"," element.appendChild(docLink);\n"," }\n"," </script>\n"," </div>\n","\n","\n","<div id=\"df-1d88a78d-63c4-4def-85a3-c5435003219b\">\n"," <button class=\"colab-df-quickchart\" onclick=\"quickchart('df-1d88a78d-63c4-4def-85a3-c5435003219b')\"\n"," title=\"Suggest charts\"\n"," style=\"display:none;\">\n","\n","<svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n"," width=\"24px\">\n"," <g>\n"," <path d=\"M19 3H5c-1.1 0-2 .9-2 2v14c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V5c0-1.1-.9-2-2-2zM9 17H7v-7h2v7zm4 0h-2V7h2v10zm4 0h-2v-4h2v4z\"/>\n"," </g>\n","</svg>\n"," </button>\n","\n","<style>\n"," .colab-df-quickchart {\n"," --bg-color: #E8F0FE;\n"," --fill-color: #1967D2;\n"," --hover-bg-color: #E2EBFA;\n"," --hover-fill-color: #174EA6;\n"," --disabled-fill-color: #AAA;\n"," --disabled-bg-color: #DDD;\n"," }\n","\n"," [theme=dark] .colab-df-quickchart {\n"," --bg-color: #3B4455;\n"," --fill-color: #D2E3FC;\n"," --hover-bg-color: #434B5C;\n"," --hover-fill-color: #FFFFFF;\n"," --disabled-bg-color: #3B4455;\n"," --disabled-fill-color: #666;\n"," }\n","\n"," .colab-df-quickchart {\n"," background-color: var(--bg-color);\n"," border: none;\n"," border-radius: 50%;\n"," cursor: pointer;\n"," display: none;\n"," fill: var(--fill-color);\n"," height: 32px;\n"," padding: 0;\n"," width: 32px;\n"," }\n","\n"," .colab-df-quickchart:hover {\n"," background-color: var(--hover-bg-color);\n"," box-shadow: 0 1px 2px rgba(60, 64, 67, 0.3), 0 1px 3px 1px rgba(60, 64, 67, 0.15);\n"," fill: var(--button-hover-fill-color);\n"," }\n","\n"," 
.colab-df-quickchart-complete:disabled,\n"," .colab-df-quickchart-complete:disabled:hover {\n"," background-color: var(--disabled-bg-color);\n"," fill: var(--disabled-fill-color);\n"," box-shadow: none;\n"," }\n","\n"," .colab-df-spinner {\n"," border: 2px solid var(--fill-color);\n"," border-color: transparent;\n"," border-bottom-color: var(--fill-color);\n"," animation:\n"," spin 1s steps(1) infinite;\n"," }\n","\n"," @keyframes spin {\n"," 0% {\n"," border-color: transparent;\n"," border-bottom-color: var(--fill-color);\n"," border-left-color: var(--fill-color);\n"," }\n"," 20% {\n"," border-color: transparent;\n"," border-left-color: var(--fill-color);\n"," border-top-color: var(--fill-color);\n"," }\n"," 30% {\n"," border-color: transparent;\n"," border-left-color: var(--fill-color);\n"," border-top-color: var(--fill-color);\n"," border-right-color: var(--fill-color);\n"," }\n"," 40% {\n"," border-color: transparent;\n"," border-right-color: var(--fill-color);\n"," border-top-color: var(--fill-color);\n"," }\n"," 60% {\n"," border-color: transparent;\n"," border-right-color: var(--fill-color);\n"," }\n"," 80% {\n"," border-color: transparent;\n"," border-right-color: var(--fill-color);\n"," border-bottom-color: var(--fill-color);\n"," }\n"," 90% {\n"," border-color: transparent;\n"," border-bottom-color: var(--fill-color);\n"," }\n"," }\n","</style>\n","\n"," <script>\n"," async function quickchart(key) {\n"," const quickchartButtonEl =\n"," document.querySelector('#' + key + ' button');\n"," quickchartButtonEl.disabled = true; // To prevent multiple clicks.\n"," quickchartButtonEl.classList.add('colab-df-spinner');\n"," try {\n"," const charts = await google.colab.kernel.invokeFunction(\n"," 'suggestCharts', [key], {});\n"," } catch (error) {\n"," console.error('Error during call to suggestCharts:', error);\n"," }\n"," quickchartButtonEl.classList.remove('colab-df-spinner');\n"," quickchartButtonEl.classList.add('colab-df-quickchart-complete');\n"," }\n"," 
(() => {\n"," let quickchartButtonEl =\n"," document.querySelector('#df-1d88a78d-63c4-4def-85a3-c5435003219b button');\n"," quickchartButtonEl.style.display =\n"," google.colab.kernel.accessAllowed ? 'block' : 'none';\n"," })();\n"," </script>\n","</div>\n"," </div>\n"," </div>\n"],"application/vnd.google.colaboratory.intrinsic+json":{"type":"dataframe","variable_name":"df","summary":"{\n \"name\": \"df\",\n \"rows\": 50000,\n \"fields\": [\n {\n \"column\": \"text\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 49582,\n \"samples\": [\n \"\\\"Soul Plane\\\" is a horrible attempt at comedy that only should appeal people with thick skulls, bloodshot eyes and furry pawns. <br /><br />The plot is not only incoherent but also non-existent, acting is mostly sub sub-par with a gang of highly moronic and dreadful characters thrown in for bad measure, jokes are often spotted miles ahead and almost never even a bit amusing. This movie lacks any structure and is full of racial stereotypes that must have seemed old even in the fifties, the only thing it really has going for it is some pretty ladies, but really, if you want that you can rent something from the \\\"Adult\\\" section. OK?<br /><br />I can hardly see anything here to recommend since you'll probably have a lot a better and productive time chasing rats with a sledgehammer or inventing waterproof teabags or whatever.<br /><br />2/10\",\n \"Guest from the Future tells a fascinating story of time travel, friendship, battle of good and evil -- all with a small budget, child actors, and few special effects. Something for Spielberg and Lucas to learn from. ;) A sixth-grader Kolya \\\"Nick\\\" Gerasimov finds a time machine in the basement of a decrepit building and travels 100 years into the future. He discovers a near-perfect, utopian society where robots play guitars and write poetry, everyone is kind to each other and people enjoy everything technology has to offer. 
Alice is the daughter of a prominent scientist who invented a device called Mielophone that allows to read minds of humans and animals. The device can be put to both good and bad use, depending on whose hands it falls into. When two evil space pirates from Saturn who want to rule the universe attempt to steal Mielophone, it falls into the hands of 20th century school boy Nick. With the pirates hot on his tracks, he travels back to his time, followed by the pirates, and Alice. Chaos, confusion and funny situations follow as the luckless pirates try to blend in with the earthlings. Alice enrolls in the same school Nick goes to and demonstrates superhuman abilities in PE class. The catch is, Alice doesn't know what Nick looks like, while the pirates do. Also, the pirates are able to change their appearance and turn literally into anyone. (Hmm, I wonder if this is where James Cameron got the idea for Terminator...) Who gets to Nick -- and Mielophone -- first? Excellent plot, non-stop adventures, and great soundtrack. I wish Hollywood made kid movies like this one...\",\n \"\\\"National Treasure\\\" (2004) is a thoroughly misguided hodge-podge of plot entanglements that borrow from nearly every cloak and dagger government conspiracy clich\\u00e9 that has ever been written. The film stars Nicholas Cage as Benjamin Franklin Gates (how precious is that, I ask you?); a seemingly normal fellow who, for no other reason than being of a lineage of like-minded misguided fortune hunters, decides to steal a 'national treasure' that has been hidden by the United States founding fathers. 
After a bit of subtext and background that plays laughably (unintentionally) like Indiana Jones meets The Patriot, the film degenerates into one misguided whimsy after another \\u0096 attempting to create a 'Stanley Goodspeed' regurgitation of Nicholas Cage and launch the whole convoluted mess forward with a series of high octane, but disconnected misadventures.<br /><br />The relevancy and logic to having George Washington and his motley crew of patriots burying a king's ransom someplace on native soil, and then, going through the meticulous plan of leaving clues scattered throughout U.S. currency art work, is something that director Jon Turteltaub never quite gets around to explaining. Couldn't Washington found better usage for such wealth during the start up of the country? Hence, we are left with a mystery built on top of an enigma that is already on shaky ground by the time Ben appoints himself the new custodian of this untold wealth. Ben's intentions are noble \\u0096 if confusing. He's set on protecting the treasure. For who and when?\\u0085your guess is as good as mine.<br /><br />But there are a few problems with Ben's crusade. First up, his friend, Ian Holmes (Sean Bean) decides that he can't wait for Ben to make up his mind about stealing the Declaration of Independence from the National Archives (oh, yeah \\u0096 brilliant idea!). Presumably, the back of that famous document holds the secret answer to the ultimate fortune. So Ian tries to kill Ben. The assassination attempt is, of course, unsuccessful, if overly melodramatic. It also affords Ben the opportunity to pick up, and pick on, the very sultry curator of the archives, Abigail Chase (Diane Kruger). She thinks Ben is clearly a nut \\u0096 at least at the beginning. 
But true to action/romance form, Abby's resolve melts quicker than you can say, \\\"is that the Hope Diamond?\\\" The film moves into full X-File-ish mode, as the FBI, mistakenly believing that Ben is behind the theft, retaliate in various benign ways that lead to a multi-layering of action sequences reminiscent of Mission Impossible meets The Fugitive. Honestly, don't those guys ever get 'intelligence' information that is correct? In the final analysis, \\\"National Treasure\\\" isn't great film making, so much as it's a patchwork rehash of tired old bits from other movies, woven together from scraps, the likes of which would make IL' Betsy Ross blush.<br /><br />The Buena Vista DVD delivers a far more generous treatment than this film is deserving of. The anamorphic widescreen picture exhibits a very smooth and finely detailed image with very rich colors, natural flesh tones, solid blacks and clean whites. The stylized image is also free of blemishes and digital enhancements. The audio is 5.1 and delivers a nice sonic boom to your side and rear speakers with intensity and realism. Extras include a host of promotional junket material that is rather deep and over the top in its explanation of how and why this film was made. If only, as an audience, we had had more clarification as to why Ben and co. were chasing after an illusive treasure, this might have been one good flick. Extras conclude with the theatrical trailer, audio commentary and deleted scenes. 
Not for the faint-hearted \\u0096 just the thick-headed.\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"label\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"negative\",\n \"positive\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}"}},"metadata":{},"execution_count":28}],"source":["df.head(3)"]},{"cell_type":"code","execution_count":29,"id":"43a27caf-779b-4bd1-a3cf-fa641021172e","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"43a27caf-779b-4bd1-a3cf-fa641021172e","executionInfo":{"status":"ok","timestamp":1713843524562,"user_tz":-420,"elapsed":334,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"fd1bd6c8-a340-49a2-deb8-e3a00e217a34"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["array(['positive', 'negative'], dtype=object)"]},"metadata":{},"execution_count":29}],"source":["df['label'].unique()"]},{"cell_type":"code","execution_count":null,"id":"c72dd5ec-59b2-4c7f-a8fb-fdade866984d","metadata":{"tags":[],"id":"c72dd5ec-59b2-4c7f-a8fb-fdade866984d"},"outputs":[],"source":["df['label'].unique()"]},{"cell_type":"code","execution_count":30,"id":"ba556f9b-da1c-4d13-8d70-563e0bd528a1","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"ba556f9b-da1c-4d13-8d70-563e0bd528a1","executionInfo":{"status":"ok","timestamp":1713843636003,"user_tz":-420,"elapsed":322,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"85b8ee33-108a-44b9-d395-e372c1b99b79"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["text 0\n","label 0\n","dtype: int64"]},"metadata":{},"execution_count":30}],"source":["df.isna().sum()"]},{"cell_type":"markdown","id":"819c31c3-873d-4d31-a21a-759059bd4c6d","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"819c31c3-873d-4d31-a21a-759059bd4c6d"},"source":["### Split the dataset 
into training and testing sets"]},{"cell_type":"code","execution_count":31,"id":"6ca318a2-26d7-446e-8324-6660171f239d","metadata":{"tags":[],"id":"6ca318a2-26d7-446e-8324-6660171f239d","executionInfo":{"status":"ok","timestamp":1713843687000,"user_tz":-420,"elapsed":1205,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["train_data, test_data, train_labels, test_labels = train_test_split(df['text'], df['label'], test_size=0.3, random_state=42)"]},{"cell_type":"code","execution_count":32,"id":"f0cfc8fc-49e5-4c88-bb33-8084dcf00100","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"f0cfc8fc-49e5-4c88-bb33-8084dcf00100","executionInfo":{"status":"ok","timestamp":1713843694590,"user_tz":-420,"elapsed":329,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"767e8a04-ed3d-466f-a935-15eab7cdb83f"},"outputs":[{"output_type":"stream","name":"stdout","text":["38094 As much as I love trains, I couldn't stomach t...\n","40624 This was a very good PPV, but like Wrestlemani...\n","49425 Not finding the right words is everybody's pro...\n","35734 I'm really suprised this movie didn't get a hi...\n","41708 I'll start by confessing that I tend to really...\n"," ... \n","11284 `Shadow Magic' recaptures the joy and amazemen...\n","44732 I found this movie to be quite enjoyable and f...\n","38158 Avoid this one! It is a terrible movie. So wha...\n","860 This production was quite a surprise for me. I...\n","15795 This is a decent movie. 
Although little bit sh...\n","Name: text, Length: 35000, dtype: object\n"]}],"source":["print(train_data)"]},{"cell_type":"code","execution_count":33,"id":"51d0a415-4982-43dd-8864-c189ba6826f4","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"51d0a415-4982-43dd-8864-c189ba6826f4","executionInfo":{"status":"ok","timestamp":1713843697940,"user_tz":-420,"elapsed":311,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"8167d4df-179d-4cf9-bf14-9112184e98be"},"outputs":[{"output_type":"stream","name":"stdout","text":["38094 negative\n","40624 positive\n","49425 negative\n","35734 positive\n","41708 negative\n"," ... \n","11284 positive\n","44732 positive\n","38158 negative\n","860 positive\n","15795 positive\n","Name: label, Length: 35000, dtype: object\n"]}],"source":["print(train_labels)"]},{"cell_type":"markdown","id":"42987cdb-4cdf-46df-95d8-7c2b2824c1ee","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"42987cdb-4cdf-46df-95d8-7c2b2824c1ee"},"source":["### Create a pipeline"]},{"cell_type":"code","execution_count":34,"id":"06ffd548-c333-4c1a-87ce-9699ddd116ee","metadata":{"tags":[],"id":"06ffd548-c333-4c1a-87ce-9699ddd116ee","executionInfo":{"status":"ok","timestamp":1713843715911,"user_tz":-420,"elapsed":333,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["sentiment_pipeline = Pipeline([\n"," ('tfidf', TfidfVectorizer()),\n"," ('nb', MultinomialNB())\n","])"]},{"cell_type":"markdown","id":"6bafa7cd-8d0b-4725-bd40-4a3b04634fab","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"6bafa7cd-8d0b-4725-bd40-4a3b04634fab"},"source":["### Train the model using the 
pipeline"]},{"cell_type":"code","execution_count":35,"id":"712dea09-52c2-4a9f-8bf9-3cbb273fe4b5","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/","height":126},"id":"712dea09-52c2-4a9f-8bf9-3cbb273fe4b5","executionInfo":{"status":"ok","timestamp":1713844075138,"user_tz":-420,"elapsed":9437,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"fda94af1-772d-4175-ee65-ab856819dea7"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["Pipeline(steps=[('tfidf', TfidfVectorizer()), ('nb', MultinomialNB())])"],"text/html":["<style>#sk-container-id-1 {color: black;background-color: white;}#sk-container-id-1 pre{padding: 0;}#sk-container-id-1 div.sk-toggleable {background-color: white;}#sk-container-id-1 label.sk-toggleable__label {cursor: pointer;display: block;width: 100%;margin-bottom: 0;padding: 0.3em;box-sizing: border-box;text-align: center;}#sk-container-id-1 label.sk-toggleable__label-arrow:before {content: \"▸\";float: left;margin-right: 0.25em;color: #696969;}#sk-container-id-1 label.sk-toggleable__label-arrow:hover:before {color: black;}#sk-container-id-1 div.sk-estimator:hover label.sk-toggleable__label-arrow:before {color: black;}#sk-container-id-1 div.sk-toggleable__content {max-height: 0;max-width: 0;overflow: hidden;text-align: left;background-color: #f0f8ff;}#sk-container-id-1 div.sk-toggleable__content pre {margin: 0.2em;color: black;border-radius: 0.25em;background-color: #f0f8ff;}#sk-container-id-1 input.sk-toggleable__control:checked~div.sk-toggleable__content {max-height: 200px;max-width: 100%;overflow: auto;}#sk-container-id-1 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {content: \"▾\";}#sk-container-id-1 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-1 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {background-color: 
#d4ebff;}#sk-container-id-1 input.sk-hidden--visually {border: 0;clip: rect(1px 1px 1px 1px);clip: rect(1px, 1px, 1px, 1px);height: 1px;margin: -1px;overflow: hidden;padding: 0;position: absolute;width: 1px;}#sk-container-id-1 div.sk-estimator {font-family: monospace;background-color: #f0f8ff;border: 1px dotted black;border-radius: 0.25em;box-sizing: border-box;margin-bottom: 0.5em;}#sk-container-id-1 div.sk-estimator:hover {background-color: #d4ebff;}#sk-container-id-1 div.sk-parallel-item::after {content: \"\";width: 100%;border-bottom: 1px solid gray;flex-grow: 1;}#sk-container-id-1 div.sk-label:hover label.sk-toggleable__label {background-color: #d4ebff;}#sk-container-id-1 div.sk-serial::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: 0;}#sk-container-id-1 div.sk-serial {display: flex;flex-direction: column;align-items: center;background-color: white;padding-right: 0.2em;padding-left: 0.2em;position: relative;}#sk-container-id-1 div.sk-item {position: relative;z-index: 1;}#sk-container-id-1 div.sk-parallel {display: flex;align-items: stretch;justify-content: center;background-color: white;position: relative;}#sk-container-id-1 div.sk-item::before, #sk-container-id-1 div.sk-parallel-item::before {content: \"\";position: absolute;border-left: 1px solid gray;box-sizing: border-box;top: 0;bottom: 0;left: 50%;z-index: -1;}#sk-container-id-1 div.sk-parallel-item {display: flex;flex-direction: column;z-index: 1;position: relative;background-color: white;}#sk-container-id-1 div.sk-parallel-item:first-child::after {align-self: flex-end;width: 50%;}#sk-container-id-1 div.sk-parallel-item:last-child::after {align-self: flex-start;width: 50%;}#sk-container-id-1 div.sk-parallel-item:only-child::after {width: 0;}#sk-container-id-1 div.sk-dashed-wrapped {border: 1px dashed gray;margin: 0 0.4em 0.5em 0.4em;box-sizing: border-box;padding-bottom: 0.4em;background-color: white;}#sk-container-id-1 
div.sk-label label {font-family: monospace;font-weight: bold;display: inline-block;line-height: 1.2em;}#sk-container-id-1 div.sk-label-container {text-align: center;}#sk-container-id-1 div.sk-container {/* jupyter's `normalize.less` sets `[hidden] { display: none; }` but bootstrap.min.css set `[hidden] { display: none !important; }` so we also need the `!important` here to be able to override the default hidden behavior on the sphinx rendered scikit-learn.org. See: https://github.com/scikit-learn/scikit-learn/issues/21755 */display: inline-block !important;position: relative;}#sk-container-id-1 div.sk-text-repr-fallback {display: none;}</style><div id=\"sk-container-id-1\" class=\"sk-top-container\"><div class=\"sk-text-repr-fallback\"><pre>Pipeline(steps=[('tfidf', TfidfVectorizer()), ('nb', MultinomialNB())])</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. <br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\"sk-container\" hidden><div class=\"sk-item sk-dashed-wrapped\"><div class=\"sk-label-container\"><div class=\"sk-label sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-1\" type=\"checkbox\" ><label for=\"sk-estimator-id-1\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">Pipeline</label><div class=\"sk-toggleable__content\"><pre>Pipeline(steps=[('tfidf', TfidfVectorizer()), ('nb', MultinomialNB())])</pre></div></div></div><div class=\"sk-serial\"><div class=\"sk-item\"><div class=\"sk-estimator sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-2\" type=\"checkbox\" ><label for=\"sk-estimator-id-2\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">TfidfVectorizer</label><div class=\"sk-toggleable__content\"><pre>TfidfVectorizer()</pre></div></div></div><div class=\"sk-item\"><div class=\"sk-estimator 
sk-toggleable\"><input class=\"sk-toggleable__control sk-hidden--visually\" id=\"sk-estimator-id-3\" type=\"checkbox\" ><label for=\"sk-estimator-id-3\" class=\"sk-toggleable__label sk-toggleable__label-arrow\">MultinomialNB</label><div class=\"sk-toggleable__content\"><pre>MultinomialNB()</pre></div></div></div></div></div></div></div>"]},"metadata":{},"execution_count":35}],"source":["sentiment_pipeline.fit(train_data, train_labels)\n"]},{"cell_type":"markdown","id":"4c95c599-ae0d-433f-9ed5-856fd9fa35e0","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"4c95c599-ae0d-433f-9ed5-856fd9fa35e0"},"source":["### Make predictions on the test set"]},{"cell_type":"code","execution_count":36,"id":"37ae9eda-4a02-4f40-bdeb-ecb8ea67f9d3","metadata":{"tags":[],"id":"37ae9eda-4a02-4f40-bdeb-ecb8ea67f9d3","executionInfo":{"status":"ok","timestamp":1713844081489,"user_tz":-420,"elapsed":3301,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}}},"outputs":[],"source":["predictions = sentiment_pipeline.predict(test_data)"]},{"cell_type":"code","source":["test_data[1]"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":109},"id":"a620DunmGUpx","executionInfo":{"status":"ok","timestamp":1713844697926,"user_tz":-420,"elapsed":4,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"6109017f-a264-46b9-cd2a-db7d91158ba0"},"id":"a620DunmGUpx","execution_count":43,"outputs":[{"output_type":"execute_result","data":{"text/plain":["'A wonderful little production. <br /><br />The filming technique is very unassuming- very old-time-BBC fashion and gives a comforting, and sometimes discomforting, sense of realism to the entire piece. <br /><br />The actors are extremely well chosen- Michael Sheen not only \"has got all the polari\" but he has all the voices down pat too! 
You can truly see the seamless editing guided by the references to Williams\\' diary entries, not only is it well worth the watching but it is a terrificly written and performed piece. A masterful production about one of the great master\\'s of comedy and his life. <br /><br />The realism really comes home with the little things: the fantasy of the guard which, rather than use the traditional \\'dream\\' techniques remains solid then disappears. It plays on our knowledge and our senses, particularly with the scenes concerning Orton and Halliwell and the sets (particularly of their flat with Halliwell\\'s murals decorating every surface) are terribly well done.'"],"application/vnd.google.colaboratory.intrinsic+json":{"type":"string"}},"metadata":{},"execution_count":43}]},{"cell_type":"code","source":["test_labels[1]"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":36},"id":"qmW5xhMgGae6","executionInfo":{"status":"ok","timestamp":1713844689037,"user_tz":-420,"elapsed":4,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"2f9176d6-62cc-454b-cf06-292c2682f59f"},"id":"qmW5xhMgGae6","execution_count":41,"outputs":[{"output_type":"execute_result","data":{"text/plain":["'positive'"],"application/vnd.google.colaboratory.intrinsic+json":{"type":"string"}},"metadata":{},"execution_count":41}]},{"cell_type":"code","source":["predictions"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"9p7uhKVvEXQn","executionInfo":{"status":"ok","timestamp":1713844095757,"user_tz":-420,"elapsed":312,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"310851b4-6a8e-4308-f477-a932a640c26c"},"id":"9p7uhKVvEXQn","execution_count":37,"outputs":[{"output_type":"execute_result","data":{"text/plain":["array(['negative', 'positive', 'negative', ..., 'negative', 'positive',\n"," 'positive'], 
dtype='<U8')"]},"metadata":{},"execution_count":37}]},{"cell_type":"markdown","id":"a33458e2-90cb-4c94-b977-8cc8ea5a273e","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"a33458e2-90cb-4c94-b977-8cc8ea5a273e"},"source":["### Evaluate the model"]},{"cell_type":"code","source":["test_data.shape"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"XDecs57CGtrY","executionInfo":{"status":"ok","timestamp":1713844728124,"user_tz":-420,"elapsed":387,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"2e38875f-dc30-455f-ec6c-4a66024c76ba"},"id":"XDecs57CGtrY","execution_count":44,"outputs":[{"output_type":"execute_result","data":{"text/plain":["(15000,)"]},"metadata":{},"execution_count":44}]},{"cell_type":"code","source":["test_labels.shape"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"KfDAFQETG1b-","executionInfo":{"status":"ok","timestamp":1713844744202,"user_tz":-420,"elapsed":2,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"245bf06a-0b44-4466-ba0f-c4fde614c1cc"},"id":"KfDAFQETG1b-","execution_count":45,"outputs":[{"output_type":"execute_result","data":{"text/plain":["(15000,)"]},"metadata":{},"execution_count":45}]},{"cell_type":"code","execution_count":46,"id":"9ad90567-93d2-4090-81be-5c77f41e379a","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"9ad90567-93d2-4090-81be-5c77f41e379a","executionInfo":{"status":"ok","timestamp":1713844759769,"user_tz":-420,"elapsed":831,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"f7aad793-8a18-4799-85f4-11d3b5df0955"},"outputs":[{"output_type":"stream","name":"stdout","text":["Classification Report:\n"," precision recall f1-score support\n","\n"," negative 0.84 0.89 0.86 7411\n"," positive 0.89 0.83 0.86 7589\n","\n"," accuracy 0.86 15000\n"," macro avg 0.86 0.86 0.86 15000\n","weighted avg 0.86 0.86 0.86 15000\n","\n"]}],"source":["\n","report = 
classification_report(test_labels, predictions)\n","\n","print(\"Classification Report:\\n\", report)"]},{"cell_type":"code","execution_count":47,"id":"ef002e29-d065-4825-a076-3d23fdfa7b59","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"ef002e29-d065-4825-a076-3d23fdfa7b59","executionInfo":{"status":"ok","timestamp":1713844776999,"user_tz":-420,"elapsed":331,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"8ebfdcdc-b29a-4e50-a8c1-c32256472966"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["array([[6620, 791],\n"," [1296, 6293]])"]},"metadata":{},"execution_count":47}],"source":["cm = confusion_matrix(test_labels, predictions)\n","cm"]},{"cell_type":"markdown","id":"6e7729bb-a833-4feb-bd2a-b04a2741bd70","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"6e7729bb-a833-4feb-bd2a-b04a2741bd70"},"source":["## Huggingface: Pre-trained sentiment analysis model\n","\n","https://huggingface.co/distilbert-base-uncased-finetuned-sst-2-english"]},{"cell_type":"code","execution_count":48,"id":"9afad444-c2cc-4f3d-b49d-07a723be6154","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/","height":291,"referenced_widgets":["6b743d09e2a24a54a0302a0aee69cc90","764f39f3c28841ba9d96fcda0daa750f","dfef59134fb040c99e9d5e2d22704629","2d753be068804858bd6a158932e8be07","c62ddd64f9c84a8f958b59c7eb3907fe","32d4d98140914c6c97bbd3b18902cef3","ab486ae08df34e688cb514a0f1ff17e8","9e094454e05f432fac232399c525c820","1fad54a4f83147eaac49f8bfd07786be","4e5b866634e342119e8c17b299c494d3","868625142e274217806ae6793e7bba1e","57fdcbfad44045d9926eb6be9b0e98e4","6f76b70971734347af420200eb4e7961","227592f3c9ce45ed980e06711e16da32","553d95aeca14426ea0cfe1658c670929","20e75f776514473b917f07a1f948bbee","21752585844c4b0a9d3e9be9a91e08ec","92823464dc54474cbff9219bfd4d7e85","0955564b996f4ce296532505fcf7b2b5","dcabc828dbe04b73ac7667ed57cddba4","5778deb87339492886307c0a27e48941","935ade78484944fc9fc3822b86629
ae7","a7d41b7b84854d81aa4fd154e4cd95cf","c038edf8e1b246b0956232182e5aa083","3b8487f5e7cb4ba5b13173f5afa41743","19dbb9ba4aa6461da50f7c27dae38194","014878ccbd574925a16453332f50b006","e09f5c2db82d4a8f85522a4da34b8e39","2ef82c50224f492aa999726610a399a1","32d1750a89c24d2f8adc77795355fee8","5bcc77b7a6d34a0dae6d00278d221d5e","d83e05f8c52445edbe640678b8961dd4","502fd49e91d94d6f8a35b5d755d74af1","9a6820b62ba24698b607aa592c2569f4","e57391fa7a9449d18de6d6cdb2fb8b22","27869bcaf68344d3b051270dbbfd2f14","045cdec112a4421b8867cdc0f3c51312","d7f66508bf454fcdbe3b86049b3b07dd","92b7a96a86bb4354b9201b5a6c797464","bb6c8ec2753c4a13ac5d830b27a5b086","18d0ecc027564d52a35ac3de71e14e5d","35dfe7bbe8334855b42a555400fa2bac","28671e25f8c94f539252c2ee0c4423ac","5b9ec995dc9842f181644d1b02806333"]},"id":"9afad444-c2cc-4f3d-b49d-07a723be6154","executionInfo":{"status":"ok","timestamp":1713844938786,"user_tz":-420,"elapsed":18112,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"06e47173-f131-45c9-8383-73b169407e74"},"outputs":[{"output_type":"stream","name":"stderr","text":["/usr/local/lib/python3.10/dist-packages/huggingface_hub/utils/_token.py:88: UserWarning: \n","The secret `HF_TOKEN` does not exist in your Colab secrets.\n","To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n","You will be able to reuse this secret in all of your notebooks.\n","Please note that authentication is recommended but still optional to access public models or datasets.\n"," warnings.warn(\n"]},{"output_type":"display_data","data":{"text/plain":["config.json: 0%| | 0.00/629 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"6b743d09e2a24a54a0302a0aee69cc90"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["model.safetensors: 0%| | 0.00/268M [00:00<?, 
?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"57fdcbfad44045d9926eb6be9b0e98e4"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["tokenizer_config.json: 0%| | 0.00/48.0 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"a7d41b7b84854d81aa4fd154e4cd95cf"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["vocab.txt: 0%| | 0.00/232k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"9a6820b62ba24698b607aa592c2569f4"}},"metadata":{}},{"output_type":"execute_result","data":{"text/plain":["[{'label': 'POSITIVE', 'score': 0.9998656511306763},\n"," {'label': 'NEGATIVE', 'score': 0.9991129040718079}]"]},"metadata":{},"execution_count":48}],"source":["\n","from transformers import pipeline\n","sentiment_analyzer = pipeline('sentiment-analysis', model =\"distilbert-base-uncased-finetuned-sst-2-english\") #, revision =\"af0f99b\")\n","data = [\"I love you\", \"I hate you\"]\n","sentiment_analyzer(data)\n"]},{"cell_type":"code","execution_count":49,"id":"4987efd9-8ca8-40b1-90cc-ff361207fb8f","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"4987efd9-8ca8-40b1-90cc-ff361207fb8f","executionInfo":{"status":"ok","timestamp":1713844974003,"user_tz":-420,"elapsed":327,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"4e317a6e-3b89-4218-e33a-cbcbe6773ad4"},"outputs":[{"output_type":"stream","name":"stdout","text":["[{'label': 'POSITIVE', 'score': 0.9996837377548218}]\n"]}],"source":["result = sentiment_analyzer(\"I love using this model!\")\n","print(result)"]},{"cell_type":"markdown","id":"68436dda-e3c3-499d-b390-60443f9a1796","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"68436dda-e3c3-499d-b390-60443f9a1796"},"source":["## Huggingface: 
Thai"]},{"cell_type":"markdown","id":"72a9f8e0-12bf-403b-8b78-e381a65e9eaa","metadata":{"id":"72a9f8e0-12bf-403b-8b78-e381a65e9eaa"},"source":["### model=\"poom-sci/WangchanBERTa-finetuned-sentiment\"\n","\n","https://huggingface.co/poom-sci/WangchanBERTa-finetuned-sentiment"]},{"cell_type":"code","execution_count":50,"id":"d698825b-3bd7-4370-871f-ac6e5fe5fe47","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/","height":245,"referenced_widgets":["a9e58e66a3b74a7a970d39c82240ee3d","d92b56350ecc4599920d9a639d985e48","799faec48b7c4b4a8217a7ae95a3348e","7655233e992f4487a8ffb26b775f203c","6cc7ca687d364b0aa320405368cebfb1","81cf201494024fdb86fb8aba5fec1684","b5eaf04b11284c13b24b5de37760b6ac","18a4efa47c184134b1fb9b1b4192e766","fbd0194ca4044406b2687d56d0006ea7","0d5462301c70484fa0af5f7d7bf5f870","3eb96c9075b04716ae3efeaa84ab027c","e697264388a941b1b296a6ffd94c4955","7619792f1e804121bd210faebd479fec","d7609127cb61448eb0375ad5eaf5a464","9588b4252d554a3caaed831a4da17769","ab426d04502b4114aa5238a0acab1325","39361e3cbf2644cc986b57dafed52e7b","87b90dc01ab545cba91c3313ad61de4e","2b13da36a00343b7929479c35826fe50","38b4787b345e48c3b945b429664f8d3d","079587d2e31546879f8349ade0007505","e9e7c9ca02934159946e6d0d77e6aaa2","eaf3e21d333545a7b6f99f4a3c2dd32d","80a0f41ee58d4dbd9068a2da541e7ab1","d0e4c46296d5466b93ca20a6dedf6ca2","67a23012dc984dcba98c2bbe3345f47c","425bb0a1ca204144a59f5352eae932cb","aef4654647424865bc40844d174666ce","fa71ffe79a5841aa83cbb2712af0d2ed","0dec19543ab842dfaa0c9672da1341ac","c8abf179a9ec4539a1f67a94af1b5ebd","a9b09ef660f04001b1540fbaa8fb8619","14b4c51735484be285cd540a15ea71e4","a9b5ad8768474490a496e527e5434285","a891122437dc425bb13c831efe311e69","4cec9a9f2630431db8a626f2332e8eba","3ab1d042923e426991132a0e4d5d9214","6cef7c9514e74a7d9e0e8ad6a45c2764","20c6909e78f8420d82d7ccd4a3b90600","21db3d4f160f4d6a8d16d56b1f8145c1","af663b93360045a1ac9c5a553895f8dd","e57f85a430494e049cfefb631ca80c4b","dcc24dba7e014f03b6507e4674fdedbd","cbf5367b9a474cd597126f9b44a
091a2","edee0ea2881947d88a88e30bbe704227","fbc7838167cd4416b67d23019b6449cc","23bd28ecfee94b879aa9a7242ff5f3a8","951dca5617c147f1ac4e13420dbc8092","0729c7bad2c54b468c652a3636a3f33a","aa8d847812bd4c3caeb1155f1bbd47e8","af97f90e51054a8d9e7114e131a20a76","8f9db8f97d43461b930600d5f728e630","ad24f48277ce4cb6bdd08829bbbafb7f","22e3e9e7755049a28fc2133b3cad808a","5efc41cf659f4146a01263112f58b43c","77cb395146a545148f7784450c10e4fd","cf00433fc3ff4e46bea7b268cf585ffa","69866f6b67e94c0e87519f1a47dfaf3b","570414a7ae604eef88fc2a2c38637bff","e53c8ef1e9e64c46b28444192c7f6005","05e5df8dd9a94658afbd9968c6a88196","d5de73166aaf41ccbb8795bc0a76cd66","d875b3552444402d80b870192244c726","cf2e96fc2f09426393a7339c1b8882e3","cf7a76769a934ea292595d4d84d19757","3e4c9662eb0a4d6fa372ffd33d0feaff"]},"id":"d698825b-3bd7-4370-871f-ac6e5fe5fe47","executionInfo":{"status":"ok","timestamp":1713844989621,"user_tz":-420,"elapsed":7775,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"662bbdb1-1ea5-411f-b4af-b28a47581779"},"outputs":[{"output_type":"display_data","data":{"text/plain":["config.json: 0%| | 0.00/965 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"a9e58e66a3b74a7a970d39c82240ee3d"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["pytorch_model.bin: 0%| | 0.00/421M [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"e697264388a941b1b296a6ffd94c4955"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["tokenizer_config.json: 0%| | 0.00/491 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"eaf3e21d333545a7b6f99f4a3c2dd32d"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["sentencepiece.bpe.model: 0%| | 0.00/905k [00:00<?, 
?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"a9b5ad8768474490a496e527e5434285"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["tokenizer.json: 0%| | 0.00/1.38M [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"edee0ea2881947d88a88e30bbe704227"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["special_tokens_map.json: 0%| | 0.00/305 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"77cb395146a545148f7784450c10e4fd"}},"metadata":{}},{"output_type":"execute_result","data":{"text/plain":["[{'label': 'pos', 'score': 0.9793058037757874},\n"," {'label': 'neg', 'score': 0.7835226058959961}]"]},"metadata":{},"execution_count":50}],"source":["from transformers import pipeline\n","\n","sentiment_analyzer = pipeline('sentiment-analysis', model=\"poom-sci/WangchanBERTa-finetuned-sentiment\")#, revision=\"b78d071\")\n","\n","data = [\"ΰΈΰΈ£ΰΉΰΈΰΈ’ΰΈΰΈ±ΰΈΰΉ\", \"ΰΈ£ΰΈΰΈΰΈ²ΰΈΰΉΰΈΰΉ\"]\n","sentiment_analyzer(data)\n"]},{"cell_type":"code","execution_count":51,"id":"87d815d4-135c-471e-93ee-cacc93653d4e","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"87d815d4-135c-471e-93ee-cacc93653d4e","executionInfo":{"status":"ok","timestamp":1713844999105,"user_tz":-420,"elapsed":404,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"a9ee94dc-6c6f-4345-f4e8-409c45efc9d3"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["[{'label': 'neg', 'score': 
0.7488928437232971}]"]},"metadata":{},"execution_count":51}],"source":["sentiment_analyzer(\"ΰΈΰΉΰΈ²ΰΈ§ΰΈΰΈΉΰΈ\")"]},{"cell_type":"code","execution_count":null,"id":"60f5c43a-6cb7-47f1-85c5-751e91599ad9","metadata":{"id":"60f5c43a-6cb7-47f1-85c5-751e91599ad9"},"outputs":[],"source":[]},{"cell_type":"markdown","id":"f894a4bd-1f04-4126-aa8d-e0211b41687e","metadata":{"jp-MarkdownHeadingCollapsed":true,"tags":[],"id":"f894a4bd-1f04-4126-aa8d-e0211b41687e"},"source":["## Deploy on Streamlit Sharing\n","\n","https://share.streamlit.io/ or https://huggingface.co/spaces\n","\n","https://docs.streamlit.io/library/api-reference\n","\n","https://github.com/\n","\n"]},{"cell_type":"code","execution_count":52,"id":"dfd5baee-dc74-4f6d-84be-52a2b89d0f28","metadata":{"tags":[],"colab":{"base_uri":"https://localhost:8080/"},"id":"dfd5baee-dc74-4f6d-84be-52a2b89d0f28","executionInfo":{"status":"ok","timestamp":1713845688947,"user_tz":-420,"elapsed":361,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"c880bab7-3b44-44cb-dda9-e674a5edf97f"},"outputs":[{"output_type":"stream","name":"stdout","text":["Writing app_senti_65130700309.py\n"]}],"source":["\n","%%writefile app_senti_65130700309.py\n","\n","\n","import streamlit as st\n","from transformers import pipeline\n","\n","# Load the sentiment analysis model\n","model_name = \"poom-sci/WangchanBERTa-finetuned-sentiment\"\n","\n","\n","@st.cache_resource\n","def load_sentiment_analyzer(name):\n","    \"\"\"Build the Hugging Face sentiment pipeline for `name`; cached so it is created only once.\"\"\"\n","    return pipeline('sentiment-analysis', model=name)\n","\n","\n","# Streamlit re-executes this script on every interaction; the cached loader avoids reloading the model each time\n","sentiment_analyzer = load_sentiment_analyzer(model_name)\n","\n","# Streamlit app\n","st.title(\"Thai Sentiment Analysis App\")\n","\n","# Input text\n","text_input = st.text_area(\"Enter Thai text for sentiment analysis\", \"ขอความเห็นหน่อย... 
\")\n","\n","# Button to trigger analysis\n","if st.button(\"Analyze Sentiment\"):\n","    if not text_input.strip():\n","        # Nothing to classify: skip the model call instead of scoring an empty string\n","        st.warning(\"Please enter some text to analyze.\")\n","    else:\n","        # Analyze sentiment using the model\n","        results = sentiment_analyzer([text_input])\n","\n","        # Extract sentiment and score of the single input\n","        sentiment = results[0]['label']\n","        score = results[0]['score']\n","\n","        # Display result as a status message followed by a progress bar\n","        st.subheader(\"Sentiment Analysis Result:\")\n","\n","        if sentiment == 'pos':\n","            st.success(f\"Positive Sentiment (Score: {score:.2f})\")\n","        elif sentiment == 'neg':\n","            st.error(f\"Negative Sentiment (Score: {score:.2f})\")\n","        else:\n","            # Any label other than 'pos'/'neg' is reported as neutral\n","            st.warning(f\"Neutral Sentiment (Score: {score:.2f})\")\n","\n","        # The bar is the same for every label, so draw it once after the message\n","        st.progress(score)\n"]},{"cell_type":"code","execution_count":53,"id":"70111967-b904-4f18-a8d0-0c8701ec35ab","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"70111967-b904-4f18-a8d0-0c8701ec35ab","executionInfo":{"status":"ok","timestamp":1713845696482,"user_tz":-420,"elapsed":341,"user":{"displayName":"wannisa paethong","userId":"05174644342145313126"}},"outputId":"4eb475a7-6b7b-44a0-e09b-32150e4d717b"},"outputs":[{"output_type":"stream","name":"stdout","text":["Writing requirements.txt\n"]}],"source":["%%writefile requirements.txt\n","streamlit\n","transformers\n","torch\n"]},{"cell_type":"code","execution_count":null,"id":"88001002-587d-403d-ab65-d060bde9d42d","metadata":{"id":"88001002-587d-403d-ab65-d060bde9d42d"},"outputs":[],"source":[]}],"metadata":{"kernelspec":{"display_name":"Python 3 
(ipykernel)","language":"python","name":"python3"},"language_info":{"codemirror_mode":{"name":"ipython","version":3},"file_extension":".py","mimetype":"text/x-python","name":"python","nbconvert_exporter":"python","pygments_lexer":"ipython3","version":"3.11.3"},"colab":{"provenance":[]},"widgets":{"application/vnd.jupyter.widget-state+json":{"6b743d09e2a24a54a0302a0aee69cc90":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_764f39f3c28841ba9d96fcda0daa750f","IPY_MODEL_dfef59134fb040c99e9d5e2d22704629","IPY_MODEL_2d753be068804858bd6a158932e8be07"],"layout":"IPY_MODEL_c62ddd64f9c84a8f958b59c7eb3907fe"}},"764f39f3c28841ba9d96fcda0daa750f":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_32d4d98140914c6c97bbd3b18902cef3","placeholder":"β","style":"IPY_MODEL_ab486ae08df34e688cb514a0f1ff17e8","value":"config.json:β100%"}},"dfef59134fb040c99e9d5e2d22704629":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout"
:"IPY_MODEL_9e094454e05f432fac232399c525c820","max":629,"min":0,"orientation":"horizontal","style":"IPY_MODEL_1fad54a4f83147eaac49f8bfd07786be","value":629}},"2d753be068804858bd6a158932e8be07":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_4e5b866634e342119e8c17b299c494d3","placeholder":"β","style":"IPY_MODEL_868625142e274217806ae6793e7bba1e","value":"β629/629β[00:00<00:00,β22.0kB/s]"}},"c62ddd64f9c84a8f958b59c7eb3907fe":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"32d4d98140914c6c97bbd3b18902cef3":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.
2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"ab486ae08df34e688cb514a0f1ff17e8":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"9e094454e05f432fac232399c525c820":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":nul
l,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"1fad54a4f83147eaac49f8bfd07786be":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"4e5b866634e342119e8c17b299c494d3":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"868625142e274217806ae6793e7bba1e":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleMod
el","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"57fdcbfad44045d9926eb6be9b0e98e4":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_6f76b70971734347af420200eb4e7961","IPY_MODEL_227592f3c9ce45ed980e06711e16da32","IPY_MODEL_553d95aeca14426ea0cfe1658c670929"],"layout":"IPY_MODEL_20e75f776514473b917f07a1f948bbee"}},"6f76b70971734347af420200eb4e7961":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_21752585844c4b0a9d3e9be9a91e08ec","placeholder":"β","style":"IPY_MODEL_92823464dc54474cbff9219bfd4d7e85","value":"model.safetensors:β100%"}},"227592f3c9ce45ed980e06711e16da32":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_0955564b996f4ce296532505fcf7b2b5","max":267832558,"min":0,"orientation":"horizontal","style":"IPY_MODEL_dcabc828dbe04b73ac7667ed57cddba4","value":267832558}},"553d95aeca14426ea0cfe16
58c670929":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_5778deb87339492886307c0a27e48941","placeholder":"β","style":"IPY_MODEL_935ade78484944fc9fc3822b86629ae7","value":"β268M/268Mβ[00:02<00:00,β56.5MB/s]"}},"20e75f776514473b917f07a1f948bbee":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"21752585844c4b0a9d3e9be9a91e08ec":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_item
s":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"92823464dc54474cbff9219bfd4d7e85":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"0955564b996f4ce296532505fcf7b2b5":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x"
:null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"dcabc828dbe04b73ac7667ed57cddba4":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"5778deb87339492886307c0a27e48941":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"935ade78484944fc9fc3822b86629ae7":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"a7d41b7b84854d81aa4fd154e4cd95cf":{"
model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_c038edf8e1b246b0956232182e5aa083","IPY_MODEL_3b8487f5e7cb4ba5b13173f5afa41743","IPY_MODEL_19dbb9ba4aa6461da50f7c27dae38194"],"layout":"IPY_MODEL_014878ccbd574925a16453332f50b006"}},"c038edf8e1b246b0956232182e5aa083":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_e09f5c2db82d4a8f85522a4da34b8e39","placeholder":"β","style":"IPY_MODEL_2ef82c50224f492aa999726610a399a1","value":"tokenizer_config.json:β100%"}},"3b8487f5e7cb4ba5b13173f5afa41743":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_32d1750a89c24d2f8adc77795355fee8","max":48,"min":0,"orientation":"horizontal","style":"IPY_MODEL_5bcc77b7a6d34a0dae6d00278d221d5e","value":48}},"19dbb9ba4aa6461da50f7c27dae38194":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_
module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_d83e05f8c52445edbe640678b8961dd4","placeholder":"β","style":"IPY_MODEL_502fd49e91d94d6f8a35b5d755d74af1","value":"β48.0/48.0β[00:00<00:00,β1.73kB/s]"}},"014878ccbd574925a16453332f50b006":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e09f5c2db82d4a8f85522a4da34b8e39":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_
column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"2ef82c50224f492aa999726610a399a1":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"32d1750a89c24d2f8adc77795355fee8":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5bcc77b7a6d34a0dae6d00278d221d5e":{"model_module":"@jupyter-widgets/controls","model_name":"P
rogressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"d83e05f8c52445edbe640678b8961dd4":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"502fd49e91d94d6f8a35b5d755d74af1":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"9a6820b62ba24698b607aa592c2569f4":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_versio
n":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_e57391fa7a9449d18de6d6cdb2fb8b22","IPY_MODEL_27869bcaf68344d3b051270dbbfd2f14","IPY_MODEL_045cdec112a4421b8867cdc0f3c51312"],"layout":"IPY_MODEL_d7f66508bf454fcdbe3b86049b3b07dd"}},"e57391fa7a9449d18de6d6cdb2fb8b22":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_92b7a96a86bb4354b9201b5a6c797464","placeholder":"β","style":"IPY_MODEL_bb6c8ec2753c4a13ac5d830b27a5b086","value":"vocab.txt:β100%"}},"27869bcaf68344d3b051270dbbfd2f14":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_18d0ecc027564d52a35ac3de71e14e5d","max":231508,"min":0,"orientation":"horizontal","style":"IPY_MODEL_35dfe7bbe8334855b42a555400fa2bac","value":231508}},"045cdec112a4421b8867cdc0f3c51312":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","descripti
on_tooltip":null,"layout":"IPY_MODEL_28671e25f8c94f539252c2ee0c4423ac","placeholder":"β","style":"IPY_MODEL_5b9ec995dc9842f181644d1b02806333","value":"β232k/232kβ[00:00<00:00,β4.50MB/s]"}},"d7f66508bf454fcdbe3b86049b3b07dd":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"92b7a96a86bb4354b9201b5a6c797464":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":nu
ll,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"bb6c8ec2753c4a13ac5d830b27a5b086":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"18d0ecc027564d52a35ac3de71e14e5d":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"35dfe7bbe8334855b42a555400fa2bac":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_vie
w_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"28671e25f8c94f539252c2ee0c4423ac":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5b9ec995dc9842f181644d1b02806333":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"a9e58e66a3b74a7a970d39c82240ee3d":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_d9
2b56350ecc4599920d9a639d985e48","IPY_MODEL_799faec48b7c4b4a8217a7ae95a3348e","IPY_MODEL_7655233e992f4487a8ffb26b775f203c"],"layout":"IPY_MODEL_6cc7ca687d364b0aa320405368cebfb1"}},"d92b56350ecc4599920d9a639d985e48":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_81cf201494024fdb86fb8aba5fec1684","placeholder":"β","style":"IPY_MODEL_b5eaf04b11284c13b24b5de37760b6ac","value":"config.json:β100%"}},"799faec48b7c4b4a8217a7ae95a3348e":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_18a4efa47c184134b1fb9b1b4192e766","max":965,"min":0,"orientation":"horizontal","style":"IPY_MODEL_fbd0194ca4044406b2687d56d0006ea7","value":965}},"7655233e992f4487a8ffb26b775f203c":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_0d5462301c70484fa0af5f7d7bf5f870","placeholder":"β","style":"IPY_MODEL_3eb96c9075b04716ae3efeaa84ab027c","value":"β965/965β[00:00<00:00,β34.6kB/s]"}},"6cc7ca687d
364b0aa320405368cebfb1":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"81cf201494024fdb86fb8aba5fec1684":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"paddin
g":null,"right":null,"top":null,"visibility":null,"width":null}},"b5eaf04b11284c13b24b5de37760b6ac":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"18a4efa47c184134b1fb9b1b4192e766":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"fbd0194ca4044406b2687d56d0006ea7":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"0d5462301c70484fa0af5f7d7bf5f870":{"model_module":"@jupyter-widgets
/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"3eb96c9075b04716ae3efeaa84ab027c":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"e697264388a941b1b296a6ffd94c4955":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_7619792f1e804121bd210faebd479fec","IPY_MODEL_d7609127cb61448eb0375ad5eaf5a464","IPY_MODEL_9588b4252d554a3caaed831a4da17769"],"layout":"IPY_MODEL_ab426d04502b4114aa5238a0acab1325"}},"7619792f1e804121bd21
0faebd479fec":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_39361e3cbf2644cc986b57dafed52e7b","placeholder":"β","style":"IPY_MODEL_87b90dc01ab545cba91c3313ad61de4e","value":"pytorch_model.bin:β100%"}},"d7609127cb61448eb0375ad5eaf5a464":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_2b13da36a00343b7929479c35826fe50","max":421072237,"min":0,"orientation":"horizontal","style":"IPY_MODEL_38b4787b345e48c3b945b429664f8d3d","value":421072237}},"9588b4252d554a3caaed831a4da17769":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_079587d2e31546879f8349ade0007505","placeholder":"β","style":"IPY_MODEL_e9e7c9ca02934159946e6d0d77e6aaa2","value":"β421M/421Mβ[00:04<00:00,β164MB/s]"}},"ab426d04502b4114aa5238a0acab1325":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_mo
dule_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"39361e3cbf2644cc986b57dafed52e7b":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"87b90dc01ab545cba91c3313ad61de4e":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel",
"model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"2b13da36a00343b7929479c35826fe50":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"38b4787b345e48c3b945b429664f8d3d":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"079587d2e31546879f8349ade0007505":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_
count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e9e7c9ca02934159946e6d0d77e6aaa2":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"eaf3e21d333545a7b6f99f4a3c2dd32d":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_80a0f41ee58d4dbd9068a2da541e7ab1","IPY_MODEL_d0e4c46296d5466b93ca20a6dedf6ca2","IPY_MODEL_67a23012dc984dcba98c2bbe3345f47c"],"layout":"IPY_MODEL_425bb0a1ca204144a59f5352eae932cb"}},"80a0f41ee58d4dbd9068a2da541e7ab1":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/contro
ls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_aef4654647424865bc40844d174666ce","placeholder":"β","style":"IPY_MODEL_fa71ffe79a5841aa83cbb2712af0d2ed","value":"tokenizer_config.json:β100%"}},"d0e4c46296d5466b93ca20a6dedf6ca2":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_0dec19543ab842dfaa0c9672da1341ac","max":491,"min":0,"orientation":"horizontal","style":"IPY_MODEL_c8abf179a9ec4539a1f67a94af1b5ebd","value":491}},"67a23012dc984dcba98c2bbe3345f47c":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_a9b09ef660f04001b1540fbaa8fb8619","placeholder":"β","style":"IPY_MODEL_14b4c51735484be285cd540a15ea71e4","value":"β491/491β[00:00<00:00,β16.6kB/s]"}},"425bb0a1ca204144a59f5352eae932cb":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"ali
gn_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"aef4654647424865bc40844d174666ce":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"fa71ffe79a5841aa83cbb2712af0d2ed":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@
jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"0dec19543ab842dfaa0c9672da1341ac":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"c8abf179a9ec4539a1f67a94af1b5ebd":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"a9b09ef660f04001b1540fbaa8fb8619":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":n
ull,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"14b4c51735484be285cd540a15ea71e4":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"a9b5ad8768474490a496e527e5434285":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_a891122437dc425bb13c831efe311e69","IPY_MODEL_4cec9a9f2630431db8a626f2332e8eba","IPY_MODEL_3ab1d042923e426991132a0e4d5d9214"],"layout":"IPY_MODEL_6cef7c9514e74a7d9e0e8ad6a45c2764"}},"a891122437dc425bb13c831efe311e69":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","descriptio
n":"","description_tooltip":null,"layout":"IPY_MODEL_20c6909e78f8420d82d7ccd4a3b90600","placeholder":"β","style":"IPY_MODEL_21db3d4f160f4d6a8d16d56b1f8145c1","value":"sentencepiece.bpe.model:β100%"}},"4cec9a9f2630431db8a626f2332e8eba":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_af663b93360045a1ac9c5a553895f8dd","max":904693,"min":0,"orientation":"horizontal","style":"IPY_MODEL_e57f85a430494e049cfefb631ca80c4b","value":904693}},"3ab1d042923e426991132a0e4d5d9214":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_dcc24dba7e014f03b6507e4674fdedbd","placeholder":"β","style":"IPY_MODEL_cbf5367b9a474cd597126f9b44a091a2","value":"β905k/905kβ[00:00<00:00,β2.94MB/s]"}},"6cef7c9514e74a7d9e0e8ad6a45c2764":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_
rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"20c6909e78f8420d82d7ccd4a3b90600":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"21db3d4f160f4d6a8d16d56b1f8145c1":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"af663b93360045a1ac9c5a553895f8dd":{"model_module":"@jupyter-widgets/base","m
odel_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e57f85a430494e049cfefb631ca80c4b":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"dcc24dba7e014f03b6507e4674fdedbd":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":
null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"cbf5367b9a474cd597126f9b44a091a2":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"edee0ea2881947d88a88e30bbe704227":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_fbc7838167cd4416b67d23019b6449cc","IPY_MODEL_23bd28ecfee94b879aa9a7242ff5f3a8","IPY_MODEL_951dca5617c147f1ac4e13420dbc8092"],"layout":"IPY_MODEL_0729c7bad2c54b468c652a3636a3f33a"}},"fbc7838167cd4416b67d23019b6449cc":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_aa8d847812bd4c3caeb1155f1bbd47e8","placeholder":"β","style":"IPY_MODEL_af97f90e51054a8d9e7114e131a20a76","value":"tokenizer.jso
n:β100%"}},"23bd28ecfee94b879aa9a7242ff5f3a8":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_8f9db8f97d43461b930600d5f728e630","max":1377628,"min":0,"orientation":"horizontal","style":"IPY_MODEL_ad24f48277ce4cb6bdd08829bbbafb7f","value":1377628}},"951dca5617c147f1ac4e13420dbc8092":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_22e3e9e7755049a28fc2133b3cad808a","placeholder":"β","style":"IPY_MODEL_5efc41cf659f4146a01263112f58b43c","value":"β1.38M/1.38Mβ[00:00<00:00,β31.3MB/s]"}},"0729c7bad2c54b468c652a3636a3f33a":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"jus
tify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"aa8d847812bd4c3caeb1155f1bbd47e8":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"af97f90e51054a8d9e7114e131a20a76":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"8f9db8f97d43461b930600d5f728e630":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"
_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"ad24f48277ce4cb6bdd08829bbbafb7f":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"22e3e9e7755049a28fc2133b3cad808a":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":n
ull,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5efc41cf659f4146a01263112f58b43c":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"77cb395146a545148f7784450c10e4fd":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_cf00433fc3ff4e46bea7b268cf585ffa","IPY_MODEL_69866f6b67e94c0e87519f1a47dfaf3b","IPY_MODEL_570414a7ae604eef88fc2a2c38637bff"],"layout":"IPY_MODEL_e53c8ef1e9e64c46b28444192c7f6005"}},"cf00433fc3ff4e46bea7b268cf585ffa":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_05e5df8dd9a94658afbd9968c6a88196","placeholder":"β","style":"IPY_MODEL_d5de73166aaf41ccbb8795bc0a76cd66","value":"special_tokens_map.json:β100%"}},"69866f6b67e94c0e87519f1a47dfaf3b":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classe
s":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_d875b3552444402d80b870192244c726","max":305,"min":0,"orientation":"horizontal","style":"IPY_MODEL_cf2e96fc2f09426393a7339c1b8882e3","value":305}},"570414a7ae604eef88fc2a2c38637bff":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_cf7a76769a934ea292595d4d84d19757","placeholder":"β","style":"IPY_MODEL_3e4c9662eb0a4d6fa372ffd33d0feaff","value":"β305/305β[00:00<00:00,β16.4kB/s]"}},"e53c8ef1e9e64c46b28444192c7f6005":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"over
flow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"05e5df8dd9a94658afbd9968c6a88196":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"d5de73166aaf41ccbb8795bc0a76cd66":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"d875b3552444402d80b870192244c726":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"displa
y":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"cf2e96fc2f09426393a7339c1b8882e3":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"cf7a76769a934ea292595d4d84d19757":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":nul
l,"top":null,"visibility":null,"width":null}},"3e4c9662eb0a4d6fa372ffd33d0feaff":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}}}}},"nbformat":4,"nbformat_minor":5} |