Spaces:

Rathgeberj
/

CS-UY4613Project

Runtime error

App Files Files Community

Jeffrey Rathgeber Jr committed on Apr 29, 2023

Commit

c7a1014

unverified ·

2 Parent(s): e3a16a8 9c787b6

Merge pull request #6 from JeffreyRathgeber/milestone-3

Browse files

Files changed (9) hide show

README.md +3 -0
TrainedModels/README.txt +1 -0
TrainedModels/tokenizer/special_tokens_map.json +7 -0
TrainedModels/tokenizer/tokenizer.json +0 -0
TrainedModels/tokenizer/tokenizer_config.json +13 -0
TrainedModels/tokenizer/vocab.txt +0 -0
TrainingAlgo.ipynb +2406 -0
aiprojecttest.py +0 -215
app.py +0 -1

README.md CHANGED Viewed

@@ -12,6 +12,9 @@ pinned: false
 # CSUY4613-Assignments
 JEFFREY RATHGEBER jr5349
 PROJECT MILESTONE 2 README  link
 https://huggingface.co/spaces/Rathgeberj/CS-UY4613Project

 # CSUY4613-Assignments
 JEFFREY RATHGEBER jr5349
+PROJECT MILESTONE 3 README LINK
+https://huggingface.co/spaces/Rathgeberj/CS-UY4613Project
 PROJECT MILESTONE 2 README  link
 https://huggingface.co/spaces/Rathgeberj/CS-UY4613Project

TrainedModels/README.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ THE ACTUAL MODELS ARE TOO LARGE TO UPLOAD TO GITHUB; SEE THE MODELS ON THE HUGGING FACE SPACE

TrainedModels/tokenizer/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

TrainedModels/tokenizer/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

TrainedModels/tokenizer/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

TrainedModels/tokenizer/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

TrainingAlgo.ipynb ADDED Viewed

	@@ -0,0 +1,2406 @@

+{
+  "nbformat": 4,
+  "nbformat_minor": 0,
+  "metadata": {
+    "colab": {
+      "provenance": []
+    },
+    "kernelspec": {
+      "name": "python3",
+      "display_name": "Python 3"
+    },
+    "language_info": {
+      "name": "python"
+    },
+    "widgets": {
+      "application/vnd.jupyter.widget-state+json": {
+        "9972abac7caf4cc6b0d98071fd7b2e05": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_b53fb6f416d8458bb0875cbace688913",
+              "IPY_MODEL_a25b06ec34a44529bd5bd686a9a381e5",
+              "IPY_MODEL_52da3fef70074ddf95a3b257dcf4b100"
+            ],
+            "layout": "IPY_MODEL_932e4324d43346e48c85af3e5d5b45c1"
+          }
+        },
+        "b53fb6f416d8458bb0875cbace688913": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_13d5e786f6294da2b6e5d90ca06c8593",
+            "placeholder": "",
+            "style": "IPY_MODEL_bbfa5943bc1c41dbaf3a2ef89ac8d0b3",
+            "value": "Downloading (…)okenizer_config.json: 100%"
+          }
+        },
+        "a25b06ec34a44529bd5bd686a9a381e5": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_3ce089610ec446c19db3bae1baa45d7a",
+            "max": 28,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_bcf06ca3212c43e0a5db7e7d4ea01375",
+            "value": 28
+          }
+        },
+        "52da3fef70074ddf95a3b257dcf4b100": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_aab6a478cec84b25a29bc0ed4ee2aaac",
+            "placeholder": "",
+            "style": "IPY_MODEL_3e6f987e297b4a2b8f3eb1b12b4b67af",
+            "value": " 28.0/28.0 [00:00&lt;00:00, 1.28kB/s]"
+          }
+        },
+        "932e4324d43346e48c85af3e5d5b45c1": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "13d5e786f6294da2b6e5d90ca06c8593": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "bbfa5943bc1c41dbaf3a2ef89ac8d0b3": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "3ce089610ec446c19db3bae1baa45d7a": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "bcf06ca3212c43e0a5db7e7d4ea01375": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "aab6a478cec84b25a29bc0ed4ee2aaac": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "3e6f987e297b4a2b8f3eb1b12b4b67af": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "3a52fbc3755a4323b749da73142e5871": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_7b2019506d154d118134985ee7e8ea43",
+              "IPY_MODEL_3a51d4dbd7654b9ab7b69a50605d29e9",
+              "IPY_MODEL_c5dd0d556c9c486baaedf3ca54cef54a"
+            ],
+            "layout": "IPY_MODEL_3b40837351f44c0f92e3e5af55da3e21"
+          }
+        },
+        "7b2019506d154d118134985ee7e8ea43": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_85a7a49bf87c4160b241a878c6b12f81",
+            "placeholder": "",
+            "style": "IPY_MODEL_9510c227a23e4d829ad9366b41babae6",
+            "value": "Downloading (…)solve/main/vocab.txt: 100%"
+          }
+        },
+        "3a51d4dbd7654b9ab7b69a50605d29e9": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_b78852da0af54675a3a1b65729eed99f",
+            "max": 231508,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_5638394766b640cdaf9208a8794636d2",
+            "value": 231508
+          }
+        },
+        "c5dd0d556c9c486baaedf3ca54cef54a": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_67535c820a3b407bb801873d788ba535",
+            "placeholder": "",
+            "style": "IPY_MODEL_365db64fb2c847a5a41b5d057d77600c",
+            "value": " 232k/232k [00:00&lt;00:00, 6.66MB/s]"
+          }
+        },
+        "3b40837351f44c0f92e3e5af55da3e21": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "85a7a49bf87c4160b241a878c6b12f81": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "9510c227a23e4d829ad9366b41babae6": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "b78852da0af54675a3a1b65729eed99f": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "5638394766b640cdaf9208a8794636d2": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "67535c820a3b407bb801873d788ba535": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "365db64fb2c847a5a41b5d057d77600c": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "d0334d8257ce422597da3d29ac22cd4f": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_eae4e7789fe54a7b98bfda99d20360bd",
+              "IPY_MODEL_5f48726592fe446ea43b7bdec668919b",
+              "IPY_MODEL_3edcc888477a440d81e8b6df174966cd"
+            ],
+            "layout": "IPY_MODEL_9a23d53c1e7a448282c1aaa36d26c4ec"
+          }
+        },
+        "eae4e7789fe54a7b98bfda99d20360bd": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_e8e2739386c045078bf2cc3987534a93",
+            "placeholder": "",
+            "style": "IPY_MODEL_bb14cd687abb432b8e2a01cd58e7c550",
+            "value": "Downloading (…)/main/tokenizer.json: 100%"
+          }
+        },
+        "5f48726592fe446ea43b7bdec668919b": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_c5c6159f813949a3851fb158a992a65c",
+            "max": 466062,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_03337be3fcd94f388ae2650078269a55",
+            "value": 466062
+          }
+        },
+        "3edcc888477a440d81e8b6df174966cd": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_ff28b23c163240dc9b543f340b9d2d52",
+            "placeholder": "",
+            "style": "IPY_MODEL_110e8e19d5f242829cc4cafdb9a10cb2",
+            "value": " 466k/466k [00:00&lt;00:00, 15.5MB/s]"
+          }
+        },
+        "9a23d53c1e7a448282c1aaa36d26c4ec": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "e8e2739386c045078bf2cc3987534a93": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "bb14cd687abb432b8e2a01cd58e7c550": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "c5c6159f813949a3851fb158a992a65c": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "03337be3fcd94f388ae2650078269a55": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "ff28b23c163240dc9b543f340b9d2d52": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "110e8e19d5f242829cc4cafdb9a10cb2": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "ee6313a98fd041c9b755be6b6a94ebff": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_40f2cc2506fd49dd9e284c1891312785",
+              "IPY_MODEL_719e9ba1b98d4170a6acff418ada38fa",
+              "IPY_MODEL_1e532190fe2b49a08a97211e3f1c60d0"
+            ],
+            "layout": "IPY_MODEL_e0ac88aa562e4354b15e182164990a79"
+          }
+        },
+        "40f2cc2506fd49dd9e284c1891312785": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_5e6bd272a50b4734a8a4dd4cb683d4e2",
+            "placeholder": "",
+            "style": "IPY_MODEL_9fd8ea0a806e4641ae945dc59baa0505",
+            "value": "Downloading (…)lve/main/config.json: 100%"
+          }
+        },
+        "719e9ba1b98d4170a6acff418ada38fa": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_941fcfabb72940a59c7fa76e3506385d",
+            "max": 483,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_23bc61b5726942169123eca1f60bd883",
+            "value": 483
+          }
+        },
+        "1e532190fe2b49a08a97211e3f1c60d0": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_b9ebd383be484f5d8fabafd4a130d6ae",
+            "placeholder": "",
+            "style": "IPY_MODEL_afdf7f80c04848fb8978d2634ee86526",
+            "value": " 483/483 [00:00&lt;00:00, 30.4kB/s]"
+          }
+        },
+        "e0ac88aa562e4354b15e182164990a79": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "5e6bd272a50b4734a8a4dd4cb683d4e2": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "9fd8ea0a806e4641ae945dc59baa0505": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "941fcfabb72940a59c7fa76e3506385d": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "23bc61b5726942169123eca1f60bd883": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "b9ebd383be484f5d8fabafd4a130d6ae": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "afdf7f80c04848fb8978d2634ee86526": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "a828e2eb329548568ea23df75056ce46": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_94f47a73ba5b402b84717807b4f127d9",
+              "IPY_MODEL_66f521247f4c4a608e4a79933ca8b499",
+              "IPY_MODEL_9012d483dc42427189bea7c35c6a9f21"
+            ],
+            "layout": "IPY_MODEL_342182d835634efd9e8dcc16c753602b"
+          }
+        },
+        "94f47a73ba5b402b84717807b4f127d9": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_a8c8ad17737448748e212de8bba42b5f",
+            "placeholder": "",
+            "style": "IPY_MODEL_e414907cc96e4e3d879a6759124fd8fe",
+            "value": "Downloading pytorch_model.bin: 100%"
+          }
+        },
+        "66f521247f4c4a608e4a79933ca8b499": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_a464bcc2342841588e7384b4c2f10a42",
+            "max": 267967963,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_6cc18dcc7a7d4361a5aac3271d47347a",
+            "value": 267967963
+          }
+        },
+        "9012d483dc42427189bea7c35c6a9f21": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_cb8c4e778a994ba7bb57f279614ebfe8",
+            "placeholder": "",
+            "style": "IPY_MODEL_739f16b75f3248489495a606ab3650ab",
+            "value": " 268M/268M [00:00&lt;00:00, 372MB/s]"
+          }
+        },
+        "342182d835634efd9e8dcc16c753602b": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "a8c8ad17737448748e212de8bba42b5f": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "e414907cc96e4e3d879a6759124fd8fe": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "a464bcc2342841588e7384b4c2f10a42": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "6cc18dcc7a7d4361a5aac3271d47347a": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "cb8c4e778a994ba7bb57f279614ebfe8": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "739f16b75f3248489495a606ab3650ab": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        }
+      }
+    }
+  },
+  "cells": [
+    {
+      "cell_type": "code",
+      "source": [
+        "from pathlib import Path\n",
+        "from sklearn.model_selection import train_test_split\n",
+        "import torch\n",
+        "from torch.utils.data import Dataset\n",
+        "from transformers import DistilBertTokenizerFast, DistilBertForSequenceClassification\n",
+        "from transformers import Trainer, TrainingArguments\n",
+        "from torch.utils.data import DataLoader\n",
+        "from transformers import AdamW\n",
+        "import pandas as pd\n",
+        "from huggingface_hub import notebook_login"
+      ],
+      "metadata": {
+        "id": "Bu9ttXsprt9w"
+      },
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "UCoa8JqwrVXU",
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 144,
+          "referenced_widgets": [
+            "9972abac7caf4cc6b0d98071fd7b2e05",
+            "b53fb6f416d8458bb0875cbace688913",
+            "a25b06ec34a44529bd5bd686a9a381e5",
+            "52da3fef70074ddf95a3b257dcf4b100",
+            "932e4324d43346e48c85af3e5d5b45c1",
+            "13d5e786f6294da2b6e5d90ca06c8593",
+            "bbfa5943bc1c41dbaf3a2ef89ac8d0b3",
+            "3ce089610ec446c19db3bae1baa45d7a",
+            "bcf06ca3212c43e0a5db7e7d4ea01375",
+            "aab6a478cec84b25a29bc0ed4ee2aaac",
+            "3e6f987e297b4a2b8f3eb1b12b4b67af",
+            "3a52fbc3755a4323b749da73142e5871",
+            "7b2019506d154d118134985ee7e8ea43",
+            "3a51d4dbd7654b9ab7b69a50605d29e9",
+            "c5dd0d556c9c486baaedf3ca54cef54a",
+            "3b40837351f44c0f92e3e5af55da3e21",
+            "85a7a49bf87c4160b241a878c6b12f81",
+            "9510c227a23e4d829ad9366b41babae6",
+            "b78852da0af54675a3a1b65729eed99f",
+            "5638394766b640cdaf9208a8794636d2",
+            "67535c820a3b407bb801873d788ba535",
+            "365db64fb2c847a5a41b5d057d77600c",
+            "d0334d8257ce422597da3d29ac22cd4f",
+            "eae4e7789fe54a7b98bfda99d20360bd",
+            "5f48726592fe446ea43b7bdec668919b",
+            "3edcc888477a440d81e8b6df174966cd",
+            "9a23d53c1e7a448282c1aaa36d26c4ec",
+            "e8e2739386c045078bf2cc3987534a93",
+            "bb14cd687abb432b8e2a01cd58e7c550",
+            "c5c6159f813949a3851fb158a992a65c",
+            "03337be3fcd94f388ae2650078269a55",
+            "ff28b23c163240dc9b543f340b9d2d52",
+            "110e8e19d5f242829cc4cafdb9a10cb2",
+            "ee6313a98fd041c9b755be6b6a94ebff",
+            "40f2cc2506fd49dd9e284c1891312785",
+            "719e9ba1b98d4170a6acff418ada38fa",
+            "1e532190fe2b49a08a97211e3f1c60d0",
+            "e0ac88aa562e4354b15e182164990a79",
+            "5e6bd272a50b4734a8a4dd4cb683d4e2",
+            "9fd8ea0a806e4641ae945dc59baa0505",
+            "941fcfabb72940a59c7fa76e3506385d",
+            "23bc61b5726942169123eca1f60bd883",
+            "b9ebd383be484f5d8fabafd4a130d6ae",
+            "afdf7f80c04848fb8978d2634ee86526"
+          ]
+        },
+        "outputId": "8feba0de-40f9-42eb-b903-68ea33e1e5ee"
+      },
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "Downloading (…)okenizer_config.json:   0%|          | 0.00/28.0 [00:00<?, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "9972abac7caf4cc6b0d98071fd7b2e05"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "Downloading (…)solve/main/vocab.txt:   0%|          | 0.00/232k [00:00<?, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "3a52fbc3755a4323b749da73142e5871"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "Downloading (…)/main/tokenizer.json:   0%|          | 0.00/466k [00:00<?, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "d0334d8257ce422597da3d29ac22cd4f"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "Downloading (…)lve/main/config.json:   0%|          | 0.00/483 [00:00<?, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "ee6313a98fd041c9b755be6b6a94ebff"
+            }
+          },
+          "metadata": {}
+        }
+      ],
+      "source": [
+        "df_train = pd.read_csv('train.csv')\n",
+        "df_test = pd.read_csv('test.csv')\n",
+        "df_test_labels = pd.read_csv('test_labels.csv')\n",
+        "\n",
+        "model_name = \"distilbert-base-uncased\"\n",
+        "\n",
+        "def read_file(f):\n",
+        "  texts = f['comment_text'].tolist()\n",
+        "  labels = []\n",
+        "  for i in range(len(f)):\n",
+        "    temp = []\n",
+        "    temp.append(f['toxic'][i])\n",
+        "    temp.append(f['severe_toxic'][i])\n",
+        "    temp.append(f['obscene'][i])\n",
+        "    temp.append(f['threat'][i])\n",
+        "    temp.append(f['insult'][i])\n",
+        "    temp.append(f['identity_hate'][i])\n",
+        "    labels.append(temp)\n",
+        "  return texts, labels\n",
+        "\n",
+        "train_texts, train_labels = read_file(df_train)\n",
+        "test_texts = df_test['comment_text'].tolist()\n",
+        "test_labels = []\n",
+        "for i in range(len(df_test_labels)):\n",
+        "  temp = []\n",
+        "  temp.append(df_test_labels['toxic'][i])\n",
+        "  temp.append(df_test_labels['severe_toxic'][i])\n",
+        "  temp.append(df_test_labels['obscene'][i])\n",
+        "  temp.append(df_test_labels['threat'][i])\n",
+        "  temp.append(df_test_labels['insult'][i])\n",
+        "  temp.append(df_test_labels['identity_hate'][i])\n",
+        "  test_labels.append(temp)\n",
+        "\n",
+        "train_texts, val_texts, train_labels, val_labels = train_test_split(train_texts, train_labels, test_size=.2)\n",
+        "\n",
+        "tokenizer = DistilBertTokenizerFast.from_pretrained(model_name)\n",
+        "\n",
+        "ind = 0\n",
+        "train_encodings = {'input_ids': [], 'attention_mask': []}\n",
+        "\n",
+        "for i in range(len(train_texts)//16):\n",
+        "  temp = tokenizer(train_texts[ind:ind+16], truncation=True, padding=True)\n",
+        "  train_encodings['input_ids'] += temp['input_ids']\n",
+        "  train_encodings['attention_mask'] += temp['attention_mask']\n",
+        "  ind += 16\n",
+        "\n",
+        "ind = 0\n",
+        "val_encodings = {'input_ids': [], 'attention_mask': []}\n",
+        "\n",
+        "for i in range(len(val_texts)//16):\n",
+        "  temp = tokenizer(val_texts[ind:ind+16], truncation=True, padding=True)\n",
+        "  val_encodings['input_ids'] += temp['input_ids']\n",
+        "  val_encodings['attention_mask'] += temp['attention_mask']\n",
+        "  ind += 16\n",
+        "\n",
+        "ind = 0\n",
+        "test_encodings = {'input_ids': [], 'attention_mask': []}\n",
+        "\n",
+        "for i in range(len(test_texts)//16):\n",
+        "  temp = tokenizer(test_texts[ind:ind+16], truncation=True, padding=True)\n",
+        "  test_encodings['input_ids'] += temp['input_ids']\n",
+        "  test_encodings['attention_mask'] += temp['attention_mask']\n",
+        "  ind += 16\n",
+        "\n",
+        "# Drop the labels of the trailing examples that were never tokenized (the\n",
+        "# loops above only encode full chunks of 16 texts). The target length must\n",
+        "# be the number of encoded rows: len() of the encodings dict itself is its\n",
+        "# key count (2), which would cut every label list down to two entries.\n",
+        "# NOTE(review): rows are padded per 16-text chunk, so their lengths can\n",
+        "# differ between chunks; confirm the batching step pads them to match.\n",
+        "del train_labels[len(train_encodings['input_ids']):]\n",
+        "del val_labels[len(val_encodings['input_ids']):]\n",
+        "del test_labels[len(test_encodings['input_ids']):]\n",
+        "\n",
+        "class dataset(Dataset):\n",
+        "  def __init__(self, encodings, labels):\n",
+        "    self.encodings = encodings\n",
+        "    self.labels = labels\n",
+        "  \n",
+        "  def __getitem__(self, idx):\n",
+        "    item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}\n",
+        "    item['labels'] = torch.tensor(self.labels[idx])\n",
+        "    return item\n",
+        "  \n",
+        "  def __len__(self):\n",
+        "    return(len(self.labels))\n",
+        "\n",
+        "train_dataset_list = [[], [], [], [], [], []]\n",
+        "for i in train_labels:\n",
+        "  for j in range(6):\n",
+        "    train_dataset_list[j].append(i[j])\n",
+        "  \n",
+        "val_dataset_list = [[], [], [], [], [], []]\n",
+        "for i in val_labels:\n",
+        "  for j in range(6):\n",
+        "    val_dataset_list[j].append(i[j])\n",
+        "\n",
+        "train_dataset_0 = dataset(train_encodings, train_dataset_list[0])\n",
+        "train_dataset_1 = dataset(train_encodings, train_dataset_list[1])\n",
+        "train_dataset_2 = dataset(train_encodings, train_dataset_list[2])\n",
+        "train_dataset_3 = dataset(train_encodings, train_dataset_list[3])\n",
+        "train_dataset_4 = dataset(train_encodings, train_dataset_list[4])\n",
+        "train_dataset_5 = dataset(train_encodings, train_dataset_list[5])\n",
+        "\n",
+        "val_dataset_0 = dataset(val_encodings, val_dataset_list[0])\n",
+        "val_dataset_1 = dataset(val_encodings, val_dataset_list[1])\n",
+        "val_dataset_2 = dataset(val_encodings, val_dataset_list[2])\n",
+        "val_dataset_3 = dataset(val_encodings, val_dataset_list[3])\n",
+        "val_dataset_4 = dataset(val_encodings, val_dataset_list[4])\n",
+        "val_dataset_5 = dataset(val_encodings, val_dataset_list[5])"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "# save tokenizer\n",
+        "tokenizer.save_pretrained(\"tokenizer.json\")"
+      ],
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "dc8jvgisXLhE",
+        "outputId": "876334df-a494-41fd-bd50-70cdab7936ad"
+      },
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "execute_result",
+          "data": {
+            "text/plain": [
+              "('tokenizer.json/tokenizer_config.json',\n",
+              " 'tokenizer.json/special_tokens_map.json',\n",
+              " 'tokenizer.json/vocab.txt',\n",
+              " 'tokenizer.json/added_tokens.json',\n",
+              " 'tokenizer.json/tokenizer.json')"
+            ]
+          },
+          "metadata": {},
+          "execution_count": 9
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "# training_args = TrainingArguments(output_dir='Rathgeberj/milestone3_fine_tuned', \n",
+        "#                                   push_to_hub=True, \n",
+        "#                                   num_train_epochs=2, \n",
+        "#                                   per_device_train_batch_size=16, \n",
+        "#                                   per_device_eval_batch_size=64, \n",
+        "#                                   warmup_steps=500, learning_rate=5e-5, \n",
+        "#                                   weight_decay=.01, logging_dir='./logs', \n",
+        "#                                   logging_steps=10)\n",
+        "# /Users/jeffreyrathgeber\n",
+        "\n",
+        "training_args = TrainingArguments(output_dir='results', \n",
+        "                                  num_train_epochs=2, \n",
+        "                                  per_device_train_batch_size=16, \n",
+        "                                  per_device_eval_batch_size=64, \n",
+        "                                  warmup_steps=500, learning_rate=5e-5, \n",
+        "                                  weight_decay=.01, logging_dir='./logs', \n",
+        "                                  logging_steps=10)\n",
+        "\n",
+        "model_0 = DistilBertForSequenceClassification.from_pretrained(model_name)\n",
+        "model_1 = DistilBertForSequenceClassification.from_pretrained(model_name)\n",
+        "model_2 = DistilBertForSequenceClassification.from_pretrained(model_name)\n",
+        "model_3 = DistilBertForSequenceClassification.from_pretrained(model_name)\n",
+        "model_4 = DistilBertForSequenceClassification.from_pretrained(model_name)\n",
+        "model_5 = DistilBertForSequenceClassification.from_pretrained(model_name)"
+      ],
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 563,
+          "referenced_widgets": [
+            "a828e2eb329548568ea23df75056ce46",
+            "94f47a73ba5b402b84717807b4f127d9",
+            "66f521247f4c4a608e4a79933ca8b499",
+            "9012d483dc42427189bea7c35c6a9f21",
+            "342182d835634efd9e8dcc16c753602b",
+            "a8c8ad17737448748e212de8bba42b5f",
+            "e414907cc96e4e3d879a6759124fd8fe",
+            "a464bcc2342841588e7384b4c2f10a42",
+            "6cc18dcc7a7d4361a5aac3271d47347a",
+            "cb8c4e778a994ba7bb57f279614ebfe8",
+            "739f16b75f3248489495a606ab3650ab"
+          ]
+        },
+        "id": "1FrCJtT23YVX",
+        "outputId": "5311555b-7789-4bd5-8931-4abc9b70360e"
+      },
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "Downloading pytorch_model.bin:   0%|          | 0.00/268M [00:00<?, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "a828e2eb329548568ea23df75056ce46"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "stream",
+          "name": "stderr",
+          "text": [
+            "Some weights of the model checkpoint at distilbert-base-uncased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_layer_norm.weight', 'vocab_transform.bias', 'vocab_layer_norm.bias', 'vocab_projector.bias', 'vocab_projector.weight']\n",
+            "- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n",
+            "- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n",
+            "Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.weight', 'pre_classifier.bias', 'classifier.bias', 'pre_classifier.weight']\n",
+            "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
+            "Some weights of the model checkpoint at distilbert-base-uncased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_layer_norm.weight', 'vocab_transform.bias', 'vocab_layer_norm.bias', 'vocab_projector.bias', 'vocab_projector.weight']\n",
+            "- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n",
+            "- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n",
+            "Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.weight', 'pre_classifier.bias', 'classifier.bias', 'pre_classifier.weight']\n",
+            "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
+            "Some weights of the model checkpoint at distilbert-base-uncased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_layer_norm.weight', 'vocab_transform.bias', 'vocab_layer_norm.bias', 'vocab_projector.bias', 'vocab_projector.weight']\n",
+            "- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n",
+            "- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n",
+            "Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.weight', 'pre_classifier.bias', 'classifier.bias', 'pre_classifier.weight']\n",
+            "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
+            "Some weights of the model checkpoint at distilbert-base-uncased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_layer_norm.weight', 'vocab_transform.bias', 'vocab_layer_norm.bias', 'vocab_projector.bias', 'vocab_projector.weight']\n",
+            "- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n",
+            "- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n",
+            "Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.weight', 'pre_classifier.bias', 'classifier.bias', 'pre_classifier.weight']\n",
+            "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
+            "Some weights of the model checkpoint at distilbert-base-uncased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_layer_norm.weight', 'vocab_transform.bias', 'vocab_layer_norm.bias', 'vocab_projector.bias', 'vocab_projector.weight']\n",
+            "- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n",
+            "- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n",
+            "Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.weight', 'pre_classifier.bias', 'classifier.bias', 'pre_classifier.weight']\n",
+            "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
+            "Some weights of the model checkpoint at distilbert-base-uncased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_layer_norm.weight', 'vocab_transform.bias', 'vocab_layer_norm.bias', 'vocab_projector.bias', 'vocab_projector.weight']\n",
+            "- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n",
+            "- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n",
+            "Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.weight', 'pre_classifier.bias', 'classifier.bias', 'pre_classifier.weight']\n",
+            "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n"
+          ]
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "# Fine-tune and save the model for label column 0. The tokenizer is passed\n",
+        "# so Trainer pads each batch to a common length: the encodings were padded\n",
+        "# per 16-text chunk, so rows from different chunks may differ in length.\n",
+        "trainer_0 = Trainer(model=model_0, args=training_args, train_dataset=train_dataset_0,\n",
+        "                    eval_dataset=val_dataset_0, tokenizer=tokenizer)\n",
+        "trainer_0.train()\n",
+        "trainer_0.save_model(output_dir='NEW')"
+      ],
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 127
+        },
+        "id": "_iaP4g715FZl",
+        "outputId": "feab2bf7-e30a-4282-8f34-4d45bf2baf55"
+      },
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stderr",
+          "text": [
+            "/usr/local/lib/python3.9/dist-packages/transformers/optimization.py:391: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
+            "  warnings.warn(\n"
+          ]
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "<IPython.core.display.HTML object>"
+            ],
+            "text/html": [
+              "\n",
+              "    <div>\n",
+              "      \n",
+              "      <progress value='2' max='2' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
+              "      [2/2 00:04, Epoch 2/2]\n",
+              "    </div>\n",
+              "    <table border=\"1\" class=\"dataframe\">\n",
+              "  <thead>\n",
+              " <tr style=\"text-align: left;\">\n",
+              "      <th>Step</th>\n",
+              "      <th>Training Loss</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "  </tbody>\n",
+              "</table><p>"
+            ]
+          },
+          "metadata": {}
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "# Fine-tune and save the model for label column 1. The tokenizer is passed\n",
+        "# so Trainer pads each batch to a common length: the encodings were padded\n",
+        "# per 16-text chunk, so rows from different chunks may differ in length.\n",
+        "trainer_1 = Trainer(model=model_1, args=training_args, train_dataset=train_dataset_1,\n",
+        "                    eval_dataset=val_dataset_1, tokenizer=tokenizer)\n",
+        "trainer_1.train()\n",
+        "trainer_1.save_model(output_dir='UPDATED_1')"
+      ],
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 74
+        },
+        "id": "q6hRKNNgGrVB",
+        "outputId": "8dddc83c-4292-424c-8534-61d8125ecac5"
+      },
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "<IPython.core.display.HTML object>"
+            ],
+            "text/html": [
+              "\n",
+              "    <div>\n",
+              "      \n",
+              "      <progress value='2' max='2' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
+              "      [2/2 00:09, Epoch 2/2]\n",
+              "    </div>\n",
+              "    <table border=\"1\" class=\"dataframe\">\n",
+              "  <thead>\n",
+              " <tr style=\"text-align: left;\">\n",
+              "      <th>Step</th>\n",
+              "      <th>Training Loss</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "  </tbody>\n",
+              "</table><p>"
+            ]
+          },
+          "metadata": {}
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "# Fine-tune and save the model for label column 2. The tokenizer is passed\n",
+        "# so Trainer pads each batch to a common length: the encodings were padded\n",
+        "# per 16-text chunk, so rows from different chunks may differ in length.\n",
+        "trainer_2 = Trainer(model=model_2, args=training_args, train_dataset=train_dataset_2,\n",
+        "                    eval_dataset=val_dataset_2, tokenizer=tokenizer)\n",
+        "trainer_2.train()\n",
+        "trainer_2.save_model(output_dir='UPDATED_2')\n"
+      ],
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 74
+        },
+        "id": "UwuqSkNdGrgk",
+        "outputId": "ecc6c398-36d1-40c3-a7ca-0ad99cf0369e"
+      },
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "<IPython.core.display.HTML object>"
+            ],
+            "text/html": [
+              "\n",
+              "    <div>\n",
+              "      \n",
+              "      <progress value='2' max='2' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
+              "      [2/2 00:03, Epoch 2/2]\n",
+              "    </div>\n",
+              "    <table border=\"1\" class=\"dataframe\">\n",
+              "  <thead>\n",
+              " <tr style=\"text-align: left;\">\n",
+              "      <th>Step</th>\n",
+              "      <th>Training Loss</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "  </tbody>\n",
+              "</table><p>"
+            ]
+          },
+          "metadata": {}
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "# Fine-tune and save the model for label column 3. The tokenizer is passed\n",
+        "# so Trainer pads each batch to a common length: the encodings were padded\n",
+        "# per 16-text chunk, so rows from different chunks may differ in length.\n",
+        "trainer_3 = Trainer(model=model_3, args=training_args, train_dataset=train_dataset_3,\n",
+        "                    eval_dataset=val_dataset_3, tokenizer=tokenizer)\n",
+        "trainer_3.train()\n",
+        "trainer_3.save_model(output_dir='UPDATED_3')"
+      ],
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 74
+        },
+        "id": "TbysKTvgGrqJ",
+        "outputId": "e8f04274-92f8-439e-b567-75d589eaaa1b"
+      },
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "<IPython.core.display.HTML object>"
+            ],
+            "text/html": [
+              "\n",
+              "    <div>\n",
+              "      \n",
+              "      <progress value='2' max='2' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
+              "      [2/2 00:03, Epoch 2/2]\n",
+              "    </div>\n",
+              "    <table border=\"1\" class=\"dataframe\">\n",
+              "  <thead>\n",
+              " <tr style=\"text-align: left;\">\n",
+              "      <th>Step</th>\n",
+              "      <th>Training Loss</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "  </tbody>\n",
+              "</table><p>"
+            ]
+          },
+          "metadata": {}
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "# Fine-tune and save the model for label column 4. The tokenizer is passed\n",
+        "# so Trainer pads each batch to a common length: the encodings were padded\n",
+        "# per 16-text chunk, so rows from different chunks may differ in length.\n",
+        "trainer_4 = Trainer(model=model_4, args=training_args, train_dataset=train_dataset_4,\n",
+        "                    eval_dataset=val_dataset_4, tokenizer=tokenizer)\n",
+        "trainer_4.train()\n",
+        "trainer_4.save_model(output_dir='UPDATED_4')"
+      ],
+      "metadata": {
+        "id": "VTJ-4cENGr05",
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 74
+        },
+        "outputId": "54cc3a64-c511-4484-c09f-f8ffe2ff65d7"
+      },
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "<IPython.core.display.HTML object>"
+            ],
+            "text/html": [
+              "\n",
+              "    <div>\n",
+              "      \n",
+              "      <progress value='2' max='2' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
+              "      [2/2 00:03, Epoch 2/2]\n",
+              "    </div>\n",
+              "    <table border=\"1\" class=\"dataframe\">\n",
+              "  <thead>\n",
+              " <tr style=\"text-align: left;\">\n",
+              "      <th>Step</th>\n",
+              "      <th>Training Loss</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "  </tbody>\n",
+              "</table><p>"
+            ]
+          },
+          "metadata": {}
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "# Fine-tune and save the model for label column 5. The tokenizer is passed\n",
+        "# so Trainer pads each batch to a common length: the encodings were padded\n",
+        "# per 16-text chunk, so rows from different chunks may differ in length.\n",
+        "trainer_5 = Trainer(model=model_5, args=training_args, train_dataset=train_dataset_5,\n",
+        "                    eval_dataset=val_dataset_5, tokenizer=tokenizer)\n",
+        "trainer_5.train()\n",
+        "trainer_5.save_model(output_dir='UPDATED_5')"
+      ],
+      "metadata": {
+        "id": "mgIWDFQ2HtXL",
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 74
+        },
+        "outputId": "7cddb662-1c2f-4923-c747-866ec6f3297d"
+      },
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "<IPython.core.display.HTML object>"
+            ],
+            "text/html": [
+              "\n",
+              "    <div>\n",
+              "      \n",
+              "      <progress value='2' max='2' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
+              "      [2/2 00:03, Epoch 2/2]\n",
+              "    </div>\n",
+              "    <table border=\"1\" class=\"dataframe\">\n",
+              "  <thead>\n",
+              " <tr style=\"text-align: left;\">\n",
+              "      <th>Step</th>\n",
+              "      <th>Training Loss</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "  </tbody>\n",
+              "</table><p>"
+            ]
+          },
+          "metadata": {}
+        }
+      ]
+    }
+  ]
+}

aiprojecttest.py DELETED Viewed

@@ -1,215 +0,0 @@
-# -*- coding: utf-8 -*-
-"""AiProjectTest.ipynb
-Automatically generated by Colaboratory.
-Original file is located at
-    https://colab.research.google.com/drive/1E4AHYbuRi_FbOMhQntdAMMZMY14hWh2e
-"""
-from pathlib import Path
-from sklearn.model_selection import train_test_split
-import torch
-from torch.utils.data import Dataset
-from transformers import DistilBertTokenizerFast, DistilBertForSequenceClassification
-from transformers import Trainer, TrainingArguments
-from torch.utils.data import DataLoader
-from transformers import AdamW
-import pandas as pd
-df_train = pd.read_csv('train.csv')
-df_test = pd.read_csv('test.csv')
-df_test_labels = pd.read_csv('test_labels.csv')
-model_name = "distilbert-base-uncased"
-def read_file(f):
-  texts = f['comment_text'].tolist()
-  labels = []
-  for i in range(len(f)):
-    temp = []
-    temp.append(f['toxic'][i])
-    temp.append(f['severe_toxic'][i])
-    temp.append(f['obscene'][i])
-    temp.append(f['threat'][i])
-    temp.append(f['insult'][i])
-    temp.append(f['identity_hate'][i])
-    labels.append(temp)
-  return texts, labels
-train_texts, train_labels = read_file(df_train)
-test_texts = df_test['comment_text'].tolist()
-test_labels = []
-for i in range(len(df_test_labels)):
-  temp = []
-  temp.append(df_test_labels['toxic'][i])
-  temp.append(df_test_labels['severe_toxic'][i])
-  temp.append(df_test_labels['obscene'][i])
-  temp.append(df_test_labels['threat'][i])
-  temp.append(df_test_labels['insult'][i])
-  temp.append(df_test_labels['identity_hate'][i])
-  test_labels.append(temp)
-train_texts, val_texts, train_labels, val_labels = train_test_split(train_texts, train_labels, test_size=.2)
-tokenizer = DistilBertTokenizerFast.from_pretrained(model_name)
-ind = 0
-train_encodings = {'input_ids': [], 'attention_mask': []}
-for i in range(len(train_texts)//16):
-  temp = tokenizer(train_texts[ind:ind+16], truncation=True, padding=True)
-  train_encodings['input_ids'] += temp['input_ids']
-  train_encodings['attention_mask'] += temp['attention_mask']
-  ind += 16
-ind = 0
-val_encodings = {'input_ids': [], 'attention_mask': []}
-for i in range(len(val_texts)//16):
-  temp = tokenizer(val_texts[ind:ind+16], truncation=True, padding=True)
-  val_encodings['input_ids'] += temp['input_ids']
-  val_encodings['attention_mask'] += temp['attention_mask']
-  ind += 16
-ind = 0
-test_encodings = {'input_ids': [], 'attention_mask': []}
-for i in range(len(test_texts)//16):
-  temp = tokenizer(test_texts[ind:ind+16], truncation=True, padding=True)
-  test_encodings['input_ids'] += temp['input_ids']
-  test_encodings['attention_mask'] += temp['attention_mask']
-  ind += 16
-while True:
-  if len(train_labels) > len(train_encodings):
-    train_labels.pop()
-  else:
-    break
-while True:
-  if len(val_labels) > len(val_encodings):
-    val_labels.pop()
-  else:
-    break
-while True:
-  if len(test_labels) > len(test_encodings):
-    test_labels.pop()
-  else:
-    break
-class dataset(Dataset):
-  def __init__(self, encodings, labels):
-    self.encodings = encodings
-    self.labels = labels
-  def __getitem__(self, idx):
-    item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
-    item['labels'] = torch.tensor(self.labels[idx])
-    return item
-  def __len__(self):
-    return(len(self.labels))
-train_dataset_list = [[], [], [], [], [], []]
-for i in train_labels:
-  for j in range(6):
-    train_dataset_list[j].append(i[j])
-val_dataset_list = [[], [], [], [], [], []]
-for i in val_labels:
-  for j in range(6):
-    val_dataset_list[j].append(i[j])
-train_dataset_0 = dataset(train_encodings, train_dataset_list[0])
-train_dataset_1 = dataset(train_encodings, train_dataset_list[1])
-train_dataset_2 = dataset(train_encodings, train_dataset_list[2])
-train_dataset_3 = dataset(train_encodings, train_dataset_list[3])
-train_dataset_4 = dataset(train_encodings, train_dataset_list[4])
-train_dataset_5 = dataset(train_encodings, train_dataset_list[5])
-val_dataset_0 = dataset(val_encodings, val_dataset_list[0])
-val_dataset_1 = dataset(val_encodings, val_dataset_list[1])
-val_dataset_2 = dataset(val_encodings, val_dataset_list[2])
-val_dataset_3 = dataset(val_encodings, val_dataset_list[3])
-val_dataset_4 = dataset(val_encodings, val_dataset_list[4])
-val_dataset_5 = dataset(val_encodings, val_dataset_list[5])
-training_args = TrainingArguments(output_dir='./results',
-                                  num_train_epochs=2,
-                                  per_device_train_batch_size=16,
-                                  per_device_eval_batch_size=64,
-                                  warmup_steps=500, learning_rate=5e-5,
-                                  weight_decay=.01, logging_dir='./logs',
-                                  logging_steps=10)
-model = DistilBertForSequenceClassification.from_pretrained(model_name)
-trainer_0 = Trainer(model=model, args=training_args, train_dataset=train_dataset_0, eval_dataset=val_dataset_0)
-trainer_0.train()
-trainer_1 = Trainer(model=model, args=training_args, train_dataset=train_dataset_1, eval_dataset=val_dataset_1)
-trainer_1.train()
-trainer_2 = Trainer(model=model, args=training_args, train_dataset=train_dataset_2, eval_dataset=val_dataset_2)
-trainer_2.train()
-trainer_3 = Trainer(model=model, args=training_args, train_dataset=train_dataset_3, eval_dataset=val_dataset_3)
-trainer_3.train()
-trainer_4 = Trainer(model=model, args=training_args, train_dataset=train_dataset_4, eval_dataset=val_dataset_4)
-trainer_4.train()
-trainer_5 = Trainer(model=model, args=training_args, train_dataset=train_dataset_5, eval_dataset=val_dataset_5)
-trainer_5.train()
-# train_dataset = dataset(train_encodings, train_labels)
-# val_dataset = dataset(val_encodings, val_labels)
-# test_dataset = dataset(test_encodings, test_labels)
-# -----------------------------------------------------------------
-# test_dataset_list = [[], [], [], [], [], []]
-# for i in test_labels:
-#   for j in range(6):
-#     test_dataset_list[j].append(i[j])
-# -----------------------------------------------------------------
-# val_dataset = dataset(val_encodings, val_labels)
-# test_dataset_0 = dataset(test_encodings, test_dataset_list[0])
-# test_dataset_1 = dataset(test_encodings, test_dataset_list[1])
-# test_dataset_2 = dataset(test_encodings, test_dataset_list[2])
-# test_dataset_3 = dataset(test_encodings, test_dataset_list[3])
-# test_dataset_4 = dataset(test_encodings, test_dataset_list[4])
-# test_dataset_5 = dataset(test_encodings, test_dataset_list[5])
-# -----------------------------------------------------------------
-# device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
-# model = DistilBertForSequenceClassification.from_pretrained('distilbert-base-uncased')
-# model.to(device)
-# model.train()
-# train_loader = DataLoader(train_dataset_0, batch_size=16, shuffle=True)
-# optim = AdamW(model.parameters(), lr=5e-5)
-# num_train_epochs = 2
-# for epoch in range(num_train_epochs):
-#     for batch in train_loader:
-#         optim.zero_grad()
-#         input_ids = batch['input_ids'].to(device)
-#         attention_mask = batch['attention_mask'].to(device)
-#         labels = batch['labels'].to(device)
-#         outputs = model(input_ids, attention_mask=attention_mask, labels=labels)
-#         loss = outputs[0]
-#         loss.backward()
-#         optim.step()
-# model.eval()

app.py CHANGED Viewed

@@ -183,4 +183,3 @@ if option == 'TextBlob':
 # tokenizer = AutoTokenizer.from_pretrained(save_directory)
 # model = AutoModelForSequenceClassification.from_pretrained(save_directory)
-#------------------------------------------------------------------------


183	# tokenizer = AutoTokenizer.from_pretrained(save_directory)
184	# model = AutoModelForSequenceClassification.from_pretrained(save_directory)
185