{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [] }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" }, "widgets": { "application/vnd.jupyter.widget-state+json": { "9972abac7caf4cc6b0d98071fd7b2e05": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_b53fb6f416d8458bb0875cbace688913", "IPY_MODEL_a25b06ec34a44529bd5bd686a9a381e5", "IPY_MODEL_52da3fef70074ddf95a3b257dcf4b100" ], "layout": "IPY_MODEL_932e4324d43346e48c85af3e5d5b45c1" } }, "b53fb6f416d8458bb0875cbace688913": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_13d5e786f6294da2b6e5d90ca06c8593", "placeholder": "​", "style": "IPY_MODEL_bbfa5943bc1c41dbaf3a2ef89ac8d0b3", "value": "Downloading (…)okenizer_config.json: 100%" } }, "a25b06ec34a44529bd5bd686a9a381e5": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": 
"", "description_tooltip": null, "layout": "IPY_MODEL_3ce089610ec446c19db3bae1baa45d7a", "max": 28, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_bcf06ca3212c43e0a5db7e7d4ea01375", "value": 28 } }, "52da3fef70074ddf95a3b257dcf4b100": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_aab6a478cec84b25a29bc0ed4ee2aaac", "placeholder": "​", "style": "IPY_MODEL_3e6f987e297b4a2b8f3eb1b12b4b67af", "value": " 28.0/28.0 [00:00<00:00, 1.28kB/s]" } }, "932e4324d43346e48c85af3e5d5b45c1": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, 
"13d5e786f6294da2b6e5d90ca06c8593": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "bbfa5943bc1c41dbaf3a2ef89ac8d0b3": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "3ce089610ec446c19db3bae1baa45d7a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": 
null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "bcf06ca3212c43e0a5db7e7d4ea01375": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "aab6a478cec84b25a29bc0ed4ee2aaac": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": 
null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "3e6f987e297b4a2b8f3eb1b12b4b67af": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "3a52fbc3755a4323b749da73142e5871": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_7b2019506d154d118134985ee7e8ea43", "IPY_MODEL_3a51d4dbd7654b9ab7b69a50605d29e9", "IPY_MODEL_c5dd0d556c9c486baaedf3ca54cef54a" ], "layout": "IPY_MODEL_3b40837351f44c0f92e3e5af55da3e21" } }, "7b2019506d154d118134985ee7e8ea43": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_85a7a49bf87c4160b241a878c6b12f81", "placeholder": "​", "style": "IPY_MODEL_9510c227a23e4d829ad9366b41babae6", "value": "Downloading 
(…)solve/main/vocab.txt: 100%" } }, "3a51d4dbd7654b9ab7b69a50605d29e9": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b78852da0af54675a3a1b65729eed99f", "max": 231508, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_5638394766b640cdaf9208a8794636d2", "value": 231508 } }, "c5dd0d556c9c486baaedf3ca54cef54a": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_67535c820a3b407bb801873d788ba535", "placeholder": "​", "style": "IPY_MODEL_365db64fb2c847a5a41b5d057d77600c", "value": " 232k/232k [00:00<00:00, 6.66MB/s]" } }, "3b40837351f44c0f92e3e5af55da3e21": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": 
null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "85a7a49bf87c4160b241a878c6b12f81": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "9510c227a23e4d829ad9366b41babae6": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "b78852da0af54675a3a1b65729eed99f": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "5638394766b640cdaf9208a8794636d2": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "67535c820a3b407bb801873d788ba535": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "365db64fb2c847a5a41b5d057d77600c": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "d0334d8257ce422597da3d29ac22cd4f": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_eae4e7789fe54a7b98bfda99d20360bd", "IPY_MODEL_5f48726592fe446ea43b7bdec668919b", "IPY_MODEL_3edcc888477a440d81e8b6df174966cd" ], "layout": "IPY_MODEL_9a23d53c1e7a448282c1aaa36d26c4ec" } }, "eae4e7789fe54a7b98bfda99d20360bd": { "model_module": "@jupyter-widgets/controls", "model_name": 
"HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e8e2739386c045078bf2cc3987534a93", "placeholder": "​", "style": "IPY_MODEL_bb14cd687abb432b8e2a01cd58e7c550", "value": "Downloading (…)/main/tokenizer.json: 100%" } }, "5f48726592fe446ea43b7bdec668919b": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c5c6159f813949a3851fb158a992a65c", "max": 466062, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_03337be3fcd94f388ae2650078269a55", "value": 466062 } }, "3edcc888477a440d81e8b6df174966cd": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ff28b23c163240dc9b543f340b9d2d52", "placeholder": "​", "style": "IPY_MODEL_110e8e19d5f242829cc4cafdb9a10cb2", "value": " 466k/466k [00:00<00:00, 15.5MB/s]" } }, "9a23d53c1e7a448282c1aaa36d26c4ec": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", 
"model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "e8e2739386c045078bf2cc3987534a93": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, 
"object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "bb14cd687abb432b8e2a01cd58e7c550": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "c5c6159f813949a3851fb158a992a65c": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "03337be3fcd94f388ae2650078269a55": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": 
"1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "ff28b23c163240dc9b543f340b9d2d52": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "110e8e19d5f242829cc4cafdb9a10cb2": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "ee6313a98fd041c9b755be6b6a94ebff": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_40f2cc2506fd49dd9e284c1891312785", "IPY_MODEL_719e9ba1b98d4170a6acff418ada38fa", "IPY_MODEL_1e532190fe2b49a08a97211e3f1c60d0" ], "layout": "IPY_MODEL_e0ac88aa562e4354b15e182164990a79" } }, "40f2cc2506fd49dd9e284c1891312785": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5e6bd272a50b4734a8a4dd4cb683d4e2", "placeholder": "​", "style": "IPY_MODEL_9fd8ea0a806e4641ae945dc59baa0505", "value": "Downloading (…)lve/main/config.json: 100%" } }, "719e9ba1b98d4170a6acff418ada38fa": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_941fcfabb72940a59c7fa76e3506385d", "max": 483, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_23bc61b5726942169123eca1f60bd883", "value": 483 } }, "1e532190fe2b49a08a97211e3f1c60d0": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b9ebd383be484f5d8fabafd4a130d6ae", "placeholder": "​", "style": "IPY_MODEL_afdf7f80c04848fb8978d2634ee86526", "value": " 483/483 [00:00<00:00, 30.4kB/s]" } }, "e0ac88aa562e4354b15e182164990a79": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "5e6bd272a50b4734a8a4dd4cb683d4e2": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, 
"border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "9fd8ea0a806e4641ae945dc59baa0505": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "941fcfabb72940a59c7fa76e3506385d": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, 
"max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "23bc61b5726942169123eca1f60bd883": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "b9ebd383be484f5d8fabafd4a130d6ae": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "afdf7f80c04848fb8978d2634ee86526": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", 
"model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "a828e2eb329548568ea23df75056ce46": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_94f47a73ba5b402b84717807b4f127d9", "IPY_MODEL_66f521247f4c4a608e4a79933ca8b499", "IPY_MODEL_9012d483dc42427189bea7c35c6a9f21" ], "layout": "IPY_MODEL_342182d835634efd9e8dcc16c753602b" } }, "94f47a73ba5b402b84717807b4f127d9": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a8c8ad17737448748e212de8bba42b5f", "placeholder": "​", "style": "IPY_MODEL_e414907cc96e4e3d879a6759124fd8fe", "value": "Downloading pytorch_model.bin: 100%" } }, "66f521247f4c4a608e4a79933ca8b499": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", 
"_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a464bcc2342841588e7384b4c2f10a42", "max": 267967963, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_6cc18dcc7a7d4361a5aac3271d47347a", "value": 267967963 } }, "9012d483dc42427189bea7c35c6a9f21": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cb8c4e778a994ba7bb57f279614ebfe8", "placeholder": "​", "style": "IPY_MODEL_739f16b75f3248489495a606ab3650ab", "value": " 268M/268M [00:00<00:00, 372MB/s]" } }, "342182d835634efd9e8dcc16c753602b": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": 
null, "right": null, "top": null, "visibility": null, "width": null } }, "a8c8ad17737448748e212de8bba42b5f": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "e414907cc96e4e3d879a6759124fd8fe": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "a464bcc2342841588e7384b4c2f10a42": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": 
"1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "6cc18dcc7a7d4361a5aac3271d47347a": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "cb8c4e778a994ba7bb57f279614ebfe8": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, 
"grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "739f16b75f3248489495a606ab3650ab": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } } } } }, "cells": [ { "cell_type": "code", "source": [ "from pathlib import Path\n", "from sklearn.model_selection import train_test_split\n", "import torch\n", "from torch.utils.data import Dataset\n", "from transformers import DistilBertTokenizerFast, DistilBertForSequenceClassification\n", "from transformers import Trainer, TrainingArguments\n", "from torch.utils.data import DataLoader\n", "from transformers import AdamW\n", "import pandas as pd\n", "from huggingface_hub import notebook_login" ], "metadata": { "id": "Bu9ttXsprt9w" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "UCoa8JqwrVXU", "colab": { "base_uri": "https://localhost:8080/", "height": 144, "referenced_widgets": [ "9972abac7caf4cc6b0d98071fd7b2e05", "b53fb6f416d8458bb0875cbace688913", "a25b06ec34a44529bd5bd686a9a381e5", "52da3fef70074ddf95a3b257dcf4b100", "932e4324d43346e48c85af3e5d5b45c1", "13d5e786f6294da2b6e5d90ca06c8593", "bbfa5943bc1c41dbaf3a2ef89ac8d0b3", "3ce089610ec446c19db3bae1baa45d7a", "bcf06ca3212c43e0a5db7e7d4ea01375", "aab6a478cec84b25a29bc0ed4ee2aaac", "3e6f987e297b4a2b8f3eb1b12b4b67af", 
"3a52fbc3755a4323b749da73142e5871", "7b2019506d154d118134985ee7e8ea43", "3a51d4dbd7654b9ab7b69a50605d29e9", "c5dd0d556c9c486baaedf3ca54cef54a", "3b40837351f44c0f92e3e5af55da3e21", "85a7a49bf87c4160b241a878c6b12f81", "9510c227a23e4d829ad9366b41babae6", "b78852da0af54675a3a1b65729eed99f", "5638394766b640cdaf9208a8794636d2", "67535c820a3b407bb801873d788ba535", "365db64fb2c847a5a41b5d057d77600c", "d0334d8257ce422597da3d29ac22cd4f", "eae4e7789fe54a7b98bfda99d20360bd", "5f48726592fe446ea43b7bdec668919b", "3edcc888477a440d81e8b6df174966cd", "9a23d53c1e7a448282c1aaa36d26c4ec", "e8e2739386c045078bf2cc3987534a93", "bb14cd687abb432b8e2a01cd58e7c550", "c5c6159f813949a3851fb158a992a65c", "03337be3fcd94f388ae2650078269a55", "ff28b23c163240dc9b543f340b9d2d52", "110e8e19d5f242829cc4cafdb9a10cb2", "ee6313a98fd041c9b755be6b6a94ebff", "40f2cc2506fd49dd9e284c1891312785", "719e9ba1b98d4170a6acff418ada38fa", "1e532190fe2b49a08a97211e3f1c60d0", "e0ac88aa562e4354b15e182164990a79", "5e6bd272a50b4734a8a4dd4cb683d4e2", "9fd8ea0a806e4641ae945dc59baa0505", "941fcfabb72940a59c7fa76e3506385d", "23bc61b5726942169123eca1f60bd883", "b9ebd383be484f5d8fabafd4a130d6ae", "afdf7f80c04848fb8978d2634ee86526" ] }, "outputId": "8feba0de-40f9-42eb-b903-68ea33e1e5ee" }, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "Downloading (…)okenizer_config.json: 0%| | 0.00/28.0 [00:00 len(train_encodings['input_ids']):\n",
 "        train_labels.pop()\n",
 "    else:\n",
 "        break\n",
 "\n",
 "# Trim surplus labels so every split has exactly one label row per encoded example\n",
 "# (train_labels is trimmed by the same rule above).\n",
 "# len(encodings) is the number of encoding fields -- the dataset class below walks\n",
 "# encodings.items() -- so the example count is read from the 'input_ids' field.\n",
 "for split_labels, split_encodings in ((val_labels, val_encodings), (test_labels, test_encodings)):\n",
 "    del split_labels[len(split_encodings['input_ids']):]\n",
 "\n",
 "class dataset(Dataset):\n",
 "    \"\"\"Map-style dataset that pairs tokenizer encodings with one label per example.\"\"\"\n",
 "\n",
 "    def __init__(self, encodings, labels):\n",
 "        \"\"\"Keep references to the inputs (nothing is copied).\n",
 "\n",
 "        encodings: mapping of field name -> per-example sequences (read via .items()).\n",
 "        labels: sequence indexed by example position; its length defines len(self).\n",
 "        \"\"\"\n",
 "        self.encodings = encodings\n",
 "        self.labels = labels\n",
 "\n",
 "    def __getitem__(self, idx):\n",
 "        \"\"\"Return example `idx` as a dict of tensors, with its label under 'labels'.\"\"\"\n",
 "        item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}\n",
 "        item['labels'] = torch.tensor(self.labels[idx])\n",
 "        return item\n",
 "\n",
 "    def __len__(self):\n",
 "        \"\"\"Number of examples, taken from the label sequence.\"\"\"\n",
 "        return len(self.labels)\n",
 "\n",
 "NUM_LABELS = 6  # each label row is indexed 0..5; one model is trained per column\n",
 "\n",
 "# Transpose the per-example label rows into one list per label column.\n",
 "train_dataset_list = [[row[column] for row in train_labels] for column in range(NUM_LABELS)]\n",
 "val_dataset_list = [[row[column] for row in val_labels] for column in range(NUM_LABELS)]\n",
 "\n",
 "# One dataset per label column; these names are consumed by the training cells.\n",
 "(train_dataset_0, train_dataset_1, train_dataset_2,\n",
 " train_dataset_3, train_dataset_4, train_dataset_5) = (\n",
 "    dataset(train_encodings, column_labels) for column_labels in train_dataset_list\n",
 ")\n",
 "(val_dataset_0, val_dataset_1, val_dataset_2,\n",
 " val_dataset_3, val_dataset_4, val_dataset_5) = (\n",
 "    dataset(val_encodings, column_labels) for column_labels in val_dataset_list\n",
 ")" ] }, { "cell_type": "code", "source": [ "# save tokenizer\n", "tokenizer.save_pretrained(\"tokenizer.json\")" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "dc8jvgisXLhE", "outputId": "876334df-a494-41fd-bd50-70cdab7936ad" }, "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "('tokenizer.json/tokenizer_config.json',\n", " 'tokenizer.json/special_tokens_map.json',\n", " 'tokenizer.json/vocab.txt',\n", " 'tokenizer.json/added_tokens.json',\n", " 'tokenizer.json/tokenizer.json')" ] }, "metadata": {}, "execution_count": 9 } ] }, { "cell_type": "code", "source": [ "# training_args = TrainingArguments(output_dir='Rathgeberj/milestone3_fine_tuned', \n", "# push_to_hub=True, \n", "# 
num_train_epochs=2, \n", "# per_device_train_batch_size=16, \n", "# per_device_eval_batch_size=64, \n", "# warmup_steps=500, learning_rate=5e-5, \n", "# weight_decay=.01, logging_dir='./logs', \n", "# logging_steps=10)\n", "# /Users/jeffreyrathgeber\n", "\n",
 "# Hyper-parameters shared by every fine-tuning run in this notebook.\n",
 "training_args = TrainingArguments(\n",
 "    output_dir='results',\n",
 "    num_train_epochs=2,\n",
 "    per_device_train_batch_size=16,\n",
 "    per_device_eval_batch_size=64,\n",
 "    warmup_steps=500,\n",
 "    learning_rate=5e-5,\n",
 "    weight_decay=0.01,\n",
 "    logging_dir='./logs',\n",
 "    logging_steps=10,\n",
 ")\n",
 "\n",
 "# Six independent copies of the pretrained checkpoint, one per training cell.\n",
 "(model_0, model_1, model_2,\n",
 " model_3, model_4, model_5) = (\n",
 "    DistilBertForSequenceClassification.from_pretrained(model_name) for _ in range(6)\n",
 ")" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 563, "referenced_widgets": [ "a828e2eb329548568ea23df75056ce46", "94f47a73ba5b402b84717807b4f127d9", "66f521247f4c4a608e4a79933ca8b499", "9012d483dc42427189bea7c35c6a9f21", "342182d835634efd9e8dcc16c753602b", "a8c8ad17737448748e212de8bba42b5f", "e414907cc96e4e3d879a6759124fd8fe", "a464bcc2342841588e7384b4c2f10a42", "6cc18dcc7a7d4361a5aac3271d47347a", "cb8c4e778a994ba7bb57f279614ebfe8", "739f16b75f3248489495a606ab3650ab" ] }, "id": "1FrCJtT23YVX", "outputId": "5311555b-7789-4bd5-8931-4abc9b70360e" }, "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "Downloading pytorch_model.bin: 0%| | 0.00/268M [00:00" ], "text/html": [ "\n", "
\n", " \n", " \n", " [2/2 00:04, Epoch 2/2]\n", "
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
StepTraining Loss

" ] }, "metadata": {} } ] }, { "cell_type": "code", "source": [
 "# Fine-tune model_1 on label column 1, then save the result under 'UPDATED_1'.\n",
 "trainer_1 = Trainer(\n",
 "    model=model_1,\n",
 "    args=training_args,\n",
 "    train_dataset=train_dataset_1,\n",
 "    eval_dataset=val_dataset_1,\n",
 ")\n",
 "trainer_1.train()\n",
 "trainer_1.save_model(output_dir='UPDATED_1')" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 74 }, "id": "q6hRKNNgGrVB", "outputId": "8dddc83c-4292-424c-8534-61d8125ecac5" }, "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "" ], "text/html": [ "\n", "

\n", " \n", " \n", " [2/2 00:09, Epoch 2/2]\n", "
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
StepTraining Loss

" ] }, "metadata": {} } ] }, { "cell_type": "code", "source": [
 "# Fine-tune model_2 on label column 2, then save the result under 'UPDATED_2'.\n",
 "trainer_2 = Trainer(\n",
 "    model=model_2,\n",
 "    args=training_args,\n",
 "    train_dataset=train_dataset_2,\n",
 "    eval_dataset=val_dataset_2,\n",
 ")\n",
 "trainer_2.train()\n",
 "trainer_2.save_model(output_dir='UPDATED_2')" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 74 }, "id": "UwuqSkNdGrgk", "outputId": "ecc6c398-36d1-40c3-a7ca-0ad99cf0369e" }, "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "" ], "text/html": [ "\n", "

\n", " \n", " \n", " [2/2 00:03, Epoch 2/2]\n", "
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
StepTraining Loss

" ] }, "metadata": {} } ] }, { "cell_type": "code", "source": [
 "# Fine-tune model_3 on label column 3, then save the result under 'UPDATED_3'.\n",
 "trainer_3 = Trainer(\n",
 "    model=model_3,\n",
 "    args=training_args,\n",
 "    train_dataset=train_dataset_3,\n",
 "    eval_dataset=val_dataset_3,\n",
 ")\n",
 "trainer_3.train()\n",
 "trainer_3.save_model(output_dir='UPDATED_3')" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 74 }, "id": "TbysKTvgGrqJ", "outputId": "e8f04274-92f8-439e-b567-75d589eaaa1b" }, "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "" ], "text/html": [ "\n", "

\n", " \n", " \n", " [2/2 00:03, Epoch 2/2]\n", "
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
StepTraining Loss

" ] }, "metadata": {} } ] }, { "cell_type": "code", "source": [
 "# Fine-tune model_4 on label column 4, then save the result under 'UPDATED_4'.\n",
 "trainer_4 = Trainer(\n",
 "    model=model_4,\n",
 "    args=training_args,\n",
 "    train_dataset=train_dataset_4,\n",
 "    eval_dataset=val_dataset_4,\n",
 ")\n",
 "trainer_4.train()\n",
 "trainer_4.save_model(output_dir='UPDATED_4')" ], "metadata": { "id": "VTJ-4cENGr05", "colab": { "base_uri": "https://localhost:8080/", "height": 74 }, "outputId": "54cc3a64-c511-4484-c09f-f8ffe2ff65d7" }, "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "" ], "text/html": [ "\n", "

\n", " \n", " \n", " [2/2 00:03, Epoch 2/2]\n", "
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
StepTraining Loss

" ] }, "metadata": {} } ] }, { "cell_type": "code", "source": [
 "# Fine-tune model_5 on label column 5, then save the result under 'UPDATED_5'.\n",
 "trainer_5 = Trainer(\n",
 "    model=model_5,\n",
 "    args=training_args,\n",
 "    train_dataset=train_dataset_5,\n",
 "    eval_dataset=val_dataset_5,\n",
 ")\n",
 "trainer_5.train()\n",
 "trainer_5.save_model(output_dir='UPDATED_5')" ], "metadata": { "id": "mgIWDFQ2HtXL", "colab": { "base_uri": "https://localhost:8080/", "height": 74 }, "outputId": "7cddb662-1c2f-4923-c747-866ec6f3297d" }, "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "" ], "text/html": [ "\n", "

\n", " \n", " \n", " [2/2 00:03, Epoch 2/2]\n", "
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
StepTraining Loss

" ] }, "metadata": {} } ] } ] }