{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [], "gpuType": "A100" }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" }, "widgets": { "application/vnd.jupyter.widget-state+json": { "fb2393ca9dd245a6aa277e1cc31db03b": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_f948bb92d53f4cb080b36c7b6dfe95cf", "IPY_MODEL_cb31c9997f7f4c629db5c304986d505e", "IPY_MODEL_6cf67a0118df4c0a9064baed0116dd07" ], "layout": "IPY_MODEL_f3b00df2056a43d4bb4485fc18374a32" } }, "f948bb92d53f4cb080b36c7b6dfe95cf": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d4e1625ab0bc4a75bb14a457e1fffc2b", "placeholder": "​", "style": "IPY_MODEL_eb6e36a9ad5f4e7c9ba923ea38da03f6", "value": "tokenizer_config.json: 100%" } }, "cb31c9997f7f4c629db5c304986d505e": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8131735faf234d80b6aa448ce871fff6", "max": 26, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_bbe035370c064c41beca92e54ff4b82a", "value": 26 } }, "6cf67a0118df4c0a9064baed0116dd07": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f3dc11d89e474bd6a683b8f6406c652d", "placeholder": "​", "style": "IPY_MODEL_1a2803e4504a4c9ba0c27ae02e02416e", "value": " 26.0/26.0 [00:00<00:00, 2.08kB/s]" } }, "f3b00df2056a43d4bb4485fc18374a32": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "d4e1625ab0bc4a75bb14a457e1fffc2b": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "eb6e36a9ad5f4e7c9ba923ea38da03f6": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "8131735faf234d80b6aa448ce871fff6": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "bbe035370c064c41beca92e54ff4b82a": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "f3dc11d89e474bd6a683b8f6406c652d": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "1a2803e4504a4c9ba0c27ae02e02416e": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "24291aa0933a450ab056fbdc926e3d55": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_c1aaba1b6c8748aeb3c9463804f654f1", "IPY_MODEL_06ebbf05e8b141cb8f62777f9bc0eac0", "IPY_MODEL_f5562a8ce84a47698c6ea86dbff2874b" ], "layout": "IPY_MODEL_5e9744f1e20e462f98515fd590636817" } }, "c1aaba1b6c8748aeb3c9463804f654f1": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0e286fa5c7c240c49a6bdd596175b2b5", "placeholder": "​", "style": "IPY_MODEL_8394c69a136b450eac324e55eda462b0", "value": "config.json: 100%" } }, "06ebbf05e8b141cb8f62777f9bc0eac0": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_89661f4ab03e4236980d012fb916b8b1", "max": 666, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_1b28439538044b51bf48bbce7588492c", "value": 666 } }, "f5562a8ce84a47698c6ea86dbff2874b": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2a341ff92a09496db4f4674dab691d5f", "placeholder": "​", "style": "IPY_MODEL_75e619fafd424abd80ac02a284e93260", "value": " 666/666 [00:00<00:00, 47.2kB/s]" } }, "5e9744f1e20e462f98515fd590636817": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "0e286fa5c7c240c49a6bdd596175b2b5": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "8394c69a136b450eac324e55eda462b0": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "89661f4ab03e4236980d012fb916b8b1": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "1b28439538044b51bf48bbce7588492c": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "2a341ff92a09496db4f4674dab691d5f": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "75e619fafd424abd80ac02a284e93260": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "cdb6fe00e4c24a03b51d291f8f3ba79b": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_0256c1d5581643f4a3ce2a8bc8e9004c", "IPY_MODEL_5976b3abbcb240d38e871b52f9285839", "IPY_MODEL_b8b157535f824bc684602cc333b00c63" ], "layout": "IPY_MODEL_676df78144394dc3b331c7438295f20e" } }, "0256c1d5581643f4a3ce2a8bc8e9004c": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a9adbbd4f7df4cb7aba88618800ca9f1", "placeholder": "​", "style": "IPY_MODEL_3947c6b5b3414745a3534628b24c0eb8", "value": "vocab.json: 100%" } }, "5976b3abbcb240d38e871b52f9285839": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f960228546324c87a59846c0e764a6f3", "max": 1042301, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_15c5d725ded246009f6d5aef65cb7533", "value": 1042301 } }, "b8b157535f824bc684602cc333b00c63": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d756fabb8b7d4ff2b5855d58a5ba3929", "placeholder": "​", "style": "IPY_MODEL_4a27186407f14bd98df85422f6c86c21", "value": " 1.04M/1.04M [00:00<00:00, 4.20MB/s]" } }, "676df78144394dc3b331c7438295f20e": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "a9adbbd4f7df4cb7aba88618800ca9f1": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "3947c6b5b3414745a3534628b24c0eb8": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "f960228546324c87a59846c0e764a6f3": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "15c5d725ded246009f6d5aef65cb7533": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "d756fabb8b7d4ff2b5855d58a5ba3929": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "4a27186407f14bd98df85422f6c86c21": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "f8e52609a94b4c94b9eac92b86228f48": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_2cfabbfe73164eafb939090b43bc197b", "IPY_MODEL_4e2b693b5255430eb2fdd177485a9bba", "IPY_MODEL_be133213af3e40adbe56df950f70e21f" ], "layout": "IPY_MODEL_86f383cb0293497aab584ee35ffe1b19" } }, "2cfabbfe73164eafb939090b43bc197b": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cf3dee2789bd43c391c1d17eaa5eb0af", "placeholder": "​", "style": "IPY_MODEL_ae783df0495841de974e12357c15fbe9", "value": "merges.txt: 100%" } }, "4e2b693b5255430eb2fdd177485a9bba": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2830d535c34e4e209ce9a0db1925ed3d", "max": 456318, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_27a857844bea40d883975cee7b244f9a", "value": 456318 } }, "be133213af3e40adbe56df950f70e21f": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1e4e6c854cc4473aa8c8deb88a24cf87", "placeholder": "​", "style": "IPY_MODEL_dacdf48c3fd443ac863ea92fcf3dea10", "value": " 456k/456k [00:00<00:00, 16.3MB/s]" } }, "86f383cb0293497aab584ee35ffe1b19": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "cf3dee2789bd43c391c1d17eaa5eb0af": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "ae783df0495841de974e12357c15fbe9": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "2830d535c34e4e209ce9a0db1925ed3d": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "27a857844bea40d883975cee7b244f9a": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "1e4e6c854cc4473aa8c8deb88a24cf87": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "dacdf48c3fd443ac863ea92fcf3dea10": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "4d77313b684c4841b166c57acca822ed": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_cf177dc87cc24d0387d318e9837e74bd", "IPY_MODEL_11c83b5b7f044e9d86f2eb8e389859a6", "IPY_MODEL_d2763d28508543bd88458615d791baca" ], "layout": "IPY_MODEL_73cc99094f184ad0ac29a63a0c2d3878" } }, "cf177dc87cc24d0387d318e9837e74bd": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b4933533714f402ea0eb9b36c643cd23", "placeholder": "​", "style": "IPY_MODEL_3493b94aafea49ddbb444f34fdbb4d9d", "value": "tokenizer.json: 100%" } }, "11c83b5b7f044e9d86f2eb8e389859a6": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_513e6d0d29014fbf8b44cb3349d2f9c5", "max": 1355256, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_27135e7cdd4742de9e633a502f57b9e6", "value": 1355256 } }, "d2763d28508543bd88458615d791baca": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6fdc41a50cf84782ae212d99d8a6d4ac", "placeholder": "​", "style": "IPY_MODEL_044068911c104c0a9ee7a26da931b859", "value": " 1.36M/1.36M [00:00<00:00, 66.4MB/s]" } }, "73cc99094f184ad0ac29a63a0c2d3878": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "b4933533714f402ea0eb9b36c643cd23": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "3493b94aafea49ddbb444f34fdbb4d9d": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "513e6d0d29014fbf8b44cb3349d2f9c5": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "27135e7cdd4742de9e633a502f57b9e6": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "6fdc41a50cf84782ae212d99d8a6d4ac": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "044068911c104c0a9ee7a26da931b859": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "8343f9ada7d84533837d35815dd900b6": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_1badf7e1789f44c994abd5792be7f5af", "IPY_MODEL_160a679f3e5a408f9998719014586718", "IPY_MODEL_5e73b02c77af47bab7741d4a1210029c" ], "layout": "IPY_MODEL_484a8d2a3a9a48199d6ead11e4b2ab4f" } }, "1badf7e1789f44c994abd5792be7f5af": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b179464f498e456a9df7c01b51acd50c", "placeholder": "​", "style": "IPY_MODEL_e6c89d946ccb49b3b10088b15d0281bd", "value": "model.safetensors: 100%" } }, "160a679f3e5a408f9998719014586718": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e7314d38ce9645e0bc6a865b8c4ccff7", "max": 3247159078, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_f2561e8cb3df4396a6ee53c0aed197d5", "value": 3247159078 } }, "5e73b02c77af47bab7741d4a1210029c": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9480c9b5ecf243608ca72c5c50f22654", "placeholder": "​", "style": "IPY_MODEL_12f6200bdad84b5a813d3cb2fe6cc362", "value": " 3.25G/3.25G [00:09<00:00, 331MB/s]" } }, "484a8d2a3a9a48199d6ead11e4b2ab4f": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "b179464f498e456a9df7c01b51acd50c": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "e6c89d946ccb49b3b10088b15d0281bd": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "e7314d38ce9645e0bc6a865b8c4ccff7": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "f2561e8cb3df4396a6ee53c0aed197d5": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "9480c9b5ecf243608ca72c5c50f22654": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "12f6200bdad84b5a813d3cb2fe6cc362": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "a9326eb1d78e4336b5efd65a4c58d48f": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_e9048f89827441928b873e49b9685f5b", "IPY_MODEL_60832605ca9b47ad830d79ab4c4f9a85", "IPY_MODEL_ad9fa65d10384c55a683dd9d99561f67" ], "layout": "IPY_MODEL_bd65929a088747b29df95b2270b951ef" } }, "e9048f89827441928b873e49b9685f5b": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_67c75ec25a9041abb64278608cdfc861", "placeholder": "​", "style": "IPY_MODEL_3281ac115abd43f385f6f1dbe218325c", "value": "generation_config.json: 100%" } }, "60832605ca9b47ad830d79ab4c4f9a85": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4461fe464d65443b921a8a7c71731a28", "max": 124, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_e6b693c0fed24b10aec8995a185a7455", "value": 124 } }, "ad9fa65d10384c55a683dd9d99561f67": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4b924f7948a34b40a7ce25025528ee1b", "placeholder": "​", "style": "IPY_MODEL_d9ec340661874a6e9d3117f7234fbe19", "value": " 124/124 [00:00<00:00, 10.2kB/s]" } }, "bd65929a088747b29df95b2270b951ef": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "67c75ec25a9041abb64278608cdfc861": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "3281ac115abd43f385f6f1dbe218325c": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "4461fe464d65443b921a8a7c71731a28": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "e6b693c0fed24b10aec8995a185a7455": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "4b924f7948a34b40a7ce25025528ee1b": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "d9ec340661874a6e9d3117f7234fbe19": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } } } }, "accelerator": "GPU" }, "cells": [ { "cell_type": "code", "source": [ "!unzip train_data.zip" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "VRqtDwq0_i9x", "outputId": "856702f4-4491-461d-e56c-92b65944cb35" }, "execution_count": 2, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Archive: train_data.rar\n", " End-of-central-directory signature not found. Either this file is not\n", " a zipfile, or it constitutes one disk of a multi-part archive. In the\n", " latter case the central directory and zipfile comment will be found on\n", " the last disk(s) of this archive.\n", "unzip: cannot find zipfile directory in one of train_data.rar or\n", " train_data.rar.zip, and cannot find train_data.rar.ZIP, period.\n" ] } ] }, { "cell_type": "code", "source": [ "!pip install peft datasets transformers[torch] accelerate -q" ], "metadata": { "id": "Shijw55Hhpnc", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "a92efdb0-6c6c-49a5-d116-a066f203fe99" }, "execution_count": 3, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\u001b[?25l \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/190.9 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m190.9/190.9 kB\u001b[0m \u001b[31m5.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h\u001b[?25l \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/510.5 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m510.5/510.5 kB\u001b[0m \u001b[31m32.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m280.0/280.0 kB\u001b[0m \u001b[31m34.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m116.3/116.3 kB\u001b[0m \u001b[31m19.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.8/134.8 kB\u001b[0m \u001b[31m18.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h" ] } ] }, { "cell_type": "code", "source": [ "import os\n", "import torch\n", "import pathlib\n", "import pandas as pd\n", "from IPython.display import clear_output" ], "metadata": { "id": "ynbp4mfyFkjU" }, "execution_count": 4, "outputs": [] }, { "cell_type": "code", "source": [ "ROOT_DIR = os.path.abspath(os.getcwd())\n", "ROOT_DIR" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 36 }, "id": "Segh-5MjFzLJ", "outputId": "f5685df7-9384-469d-a070-fdb656a44412" }, "execution_count": 5, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "'/content'" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "string" } }, "metadata": {}, "execution_count": 5 } ] }, { "cell_type": "markdown", "source": [ "По факту можно написать" ], "metadata": { "id": "VvS6ovZUKWFH" } }, { "cell_type": "code", "source": [ "CHARACTER = \"rachel\"\n", "model_type = \"gpt2-large\" # 'gpt2', 'gpt2-medium', 'gpt2-large'" ], "metadata": { "id": "kIRqGDy3KQBO" }, "execution_count": 6, "outputs": [] }, { "cell_type": "code", "source": [ "from transformers import AutoTokenizer\n", "from transformers import pipeline\n", "from transformers import TextDataset, DataCollatorForLanguageModeling\n", "from transformers import Trainer, TrainingArguments,AutoModelWithLMHead" ], "metadata": { "id": "_ZZbK_z8LmEB" }, "execution_count": 7, "outputs": [] }, { "cell_type": "markdown", "source": [ "Training on monologues" ], "metadata": { "id": "NBJMq1rZL-tN" } }, { "cell_type": "code", "source": [ "tokenizer = AutoTokenizer.from_pretrained(model_type)" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 286, "referenced_widgets": [ "fb2393ca9dd245a6aa277e1cc31db03b", "f948bb92d53f4cb080b36c7b6dfe95cf", "cb31c9997f7f4c629db5c304986d505e", "6cf67a0118df4c0a9064baed0116dd07", "f3b00df2056a43d4bb4485fc18374a32", "d4e1625ab0bc4a75bb14a457e1fffc2b", "eb6e36a9ad5f4e7c9ba923ea38da03f6", "8131735faf234d80b6aa448ce871fff6", "bbe035370c064c41beca92e54ff4b82a", "f3dc11d89e474bd6a683b8f6406c652d", "1a2803e4504a4c9ba0c27ae02e02416e", "24291aa0933a450ab056fbdc926e3d55", "c1aaba1b6c8748aeb3c9463804f654f1", "06ebbf05e8b141cb8f62777f9bc0eac0", "f5562a8ce84a47698c6ea86dbff2874b", "5e9744f1e20e462f98515fd590636817", "0e286fa5c7c240c49a6bdd596175b2b5", "8394c69a136b450eac324e55eda462b0", "89661f4ab03e4236980d012fb916b8b1", "1b28439538044b51bf48bbce7588492c", "2a341ff92a09496db4f4674dab691d5f", "75e619fafd424abd80ac02a284e93260", "cdb6fe00e4c24a03b51d291f8f3ba79b", "0256c1d5581643f4a3ce2a8bc8e9004c", "5976b3abbcb240d38e871b52f9285839", "b8b157535f824bc684602cc333b00c63", "676df78144394dc3b331c7438295f20e", "a9adbbd4f7df4cb7aba88618800ca9f1", "3947c6b5b3414745a3534628b24c0eb8", "f960228546324c87a59846c0e764a6f3", "15c5d725ded246009f6d5aef65cb7533", "d756fabb8b7d4ff2b5855d58a5ba3929", "4a27186407f14bd98df85422f6c86c21", "f8e52609a94b4c94b9eac92b86228f48", "2cfabbfe73164eafb939090b43bc197b", "4e2b693b5255430eb2fdd177485a9bba", "be133213af3e40adbe56df950f70e21f", "86f383cb0293497aab584ee35ffe1b19", "cf3dee2789bd43c391c1d17eaa5eb0af", "ae783df0495841de974e12357c15fbe9", "2830d535c34e4e209ce9a0db1925ed3d", "27a857844bea40d883975cee7b244f9a", "1e4e6c854cc4473aa8c8deb88a24cf87", "dacdf48c3fd443ac863ea92fcf3dea10", "4d77313b684c4841b166c57acca822ed", "cf177dc87cc24d0387d318e9837e74bd", "11c83b5b7f044e9d86f2eb8e389859a6", "d2763d28508543bd88458615d791baca", "73cc99094f184ad0ac29a63a0c2d3878", "b4933533714f402ea0eb9b36c643cd23", "3493b94aafea49ddbb444f34fdbb4d9d", "513e6d0d29014fbf8b44cb3349d2f9c5", "27135e7cdd4742de9e633a502f57b9e6", "6fdc41a50cf84782ae212d99d8a6d4ac", "044068911c104c0a9ee7a26da931b859" ] }, "id": "xb3UH4QDMCn7", "outputId": "9dacffec-63da-4748-acf9-8997edfb4434" }, "execution_count": 8, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "/usr/local/lib/python3.10/dist-packages/huggingface_hub/utils/_token.py:88: UserWarning: \n", "The secret `HF_TOKEN` does not exist in your Colab secrets.\n", "To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n", "You will be able to reuse this secret in all of your notebooks.\n", "Please note that authentication is recommended but still optional to access public models or datasets.\n", " warnings.warn(\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ "tokenizer_config.json: 0%| | 0.00/26.0 [00:00 1024). Running this sequence through the model will result in indexing errors\n" ] } ] }, { "cell_type": "code", "source": [ "!mkdir ./models" ], "metadata": { "id": "rWmnGJzsVTV4" }, "execution_count": 12, "outputs": [] }, { "cell_type": "code", "source": [ "model = AutoModelWithLMHead.from_pretrained(model_type)\n", "output_folder = f\"./models/en_{model_type}_{CHARACTER}_mono\"" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 137, "referenced_widgets": [ "8343f9ada7d84533837d35815dd900b6", "1badf7e1789f44c994abd5792be7f5af", "160a679f3e5a408f9998719014586718", "5e73b02c77af47bab7741d4a1210029c", "484a8d2a3a9a48199d6ead11e4b2ab4f", "b179464f498e456a9df7c01b51acd50c", "e6c89d946ccb49b3b10088b15d0281bd", "e7314d38ce9645e0bc6a865b8c4ccff7", "f2561e8cb3df4396a6ee53c0aed197d5", "9480c9b5ecf243608ca72c5c50f22654", "12f6200bdad84b5a813d3cb2fe6cc362", "a9326eb1d78e4336b5efd65a4c58d48f", "e9048f89827441928b873e49b9685f5b", "60832605ca9b47ad830d79ab4c4f9a85", "ad9fa65d10384c55a683dd9d99561f67", "bd65929a088747b29df95b2270b951ef", "67c75ec25a9041abb64278608cdfc861", "3281ac115abd43f385f6f1dbe218325c", "4461fe464d65443b921a8a7c71731a28", "e6b693c0fed24b10aec8995a185a7455", "4b924f7948a34b40a7ce25025528ee1b", "d9ec340661874a6e9d3117f7234fbe19" ] }, "id": "SagaGDCBQNEl", "outputId": "20b6cef5-2ac1-4fc7-f822-cfeece689129" }, "execution_count": 13, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "/usr/local/lib/python3.10/dist-packages/transformers/models/auto/modeling_auto.py:1595: FutureWarning: The class `AutoModelWithLMHead` is deprecated and will be removed in a future version. Please use `AutoModelForCausalLM` for causal language models, `AutoModelForMaskedLM` for masked language models and `AutoModelForSeq2SeqLM` for encoder-decoder models.\n", " warnings.warn(\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ "model.safetensors: 0%| | 0.00/3.25G [00:00" ], "text/html": [ "\n", "
\n", " \n", " \n", " [1320/1320 12:32, Epoch 5/5]\n", "
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
StepTraining LossValidation Loss
200No log1.390404
400No log1.377137
6001.3985001.380381
8001.3985001.380880
10001.2398001.387712
12001.2398001.397241

" ] }, "metadata": {} }, { "output_type": "stream", "name": "stderr", "text": [ "There were missing keys in the checkpoint model loaded: ['lm_head.weight'].\n" ] }, { "output_type": "execute_result", "data": { "text/plain": [ "TrainOutput(global_step=1320, training_loss=1.2858209552186908, metrics={'train_runtime': 751.9269, 'train_samples_per_second': 14.051, 'train_steps_per_second': 1.755, 'total_flos': 5745102815232000.0, 'train_loss': 1.2858209552186908, 'epoch': 5.0})" ] }, "metadata": {}, "execution_count": 18 } ] }, { "cell_type": "code", "source": [ "trainer.save_model()" ], "metadata": { "id": "Hzb8Zm4zYJkc" }, "execution_count": 19, "outputs": [] }, { "cell_type": "code", "source": [ "# The name of the task to train.\n", "TASK_NAME = f\"{model_type}_mono_en_{CHARACTER}\"\n", "\n", "# The output directory where the fine-tuned model and checkpoints will be written.\n", "OUTPUT_DIR = f'{ROOT_DIR}/outputs/{TASK_NAME}/'\n", "pathlib.Path(OUTPUT_DIR).mkdir(parents=True, exist_ok=True)\n", "\n", "CONFIG_NAME = \"config.json\"\n", "WEIGHTS_NAME = f\"{TASK_NAME}_pytorch_model.bin\"" ], "metadata": { "id": "Kqbabg4afTjj" }, "execution_count": 20, "outputs": [] }, { "cell_type": "code", "source": [ "def saver(model, OUTPUT_DIR, WEIGHTS_NAME):\n", " model_to_save = model.module if hasattr(model, 'module') else model # Only save the model it-self\n", "\n", " # If we save using the predefined names, we can load using `from_pretrained`\n", " output_model_file = os.path.join(OUTPUT_DIR, WEIGHTS_NAME)\n", " output_config_file = os.path.join(OUTPUT_DIR, CONFIG_NAME)\n", "\n", " torch.save(model_to_save.state_dict(), output_model_file)\n", " model_to_save.config.to_json_file(output_config_file)\n", "\n", "saver(model, OUTPUT_DIR, WEIGHTS_NAME)" ], "metadata": { "id": "SYbsx5ltfv49" }, "execution_count": 21, "outputs": [] }, { "cell_type": "code", "source": [ "path_to_dialogs_data = './train_data/en/replics/'\n", "train_path = path_to_dialogs_data + f'train_{CHARACTER}_replics.txt'\n", "test_path = path_to_dialogs_data + f'valid_{CHARACTER}_replics.txt'\n", "train_path, test_path" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "dB7DqnX6kAdZ", "outputId": "23ee3d57-e363-49ea-a55c-bcc04be1bd0d" }, "execution_count": 22, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "('./train_data/en/replics/train_rachel_replics.txt',\n", " './train_data/en/replics/valid_rachel_replics.txt')" ] }, "metadata": {}, "execution_count": 22 } ] }, { "cell_type": "code", "source": [ "train_dataset, test_dataset, data_collator = load_dataset(train_path, test_path, tokenizer)" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "LotVFrEFZun9", "outputId": "c75d2226-6a2d-4b5f-e1b9-6f769a4e517a" }, "execution_count": 23, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "/usr/local/lib/python3.10/dist-packages/transformers/data/datasets/language_modeling.py:53: FutureWarning: This dataset will be removed from the library soon, preprocessing should be handled with the 🤗 Datasets library. You can have a look at this example script for pointers: https://github.com/huggingface/transformers/blob/main/examples/pytorch/language-modeling/run_mlm.py\n", " warnings.warn(\n" ] } ] }, { "cell_type": "code", "source": [ "model = AutoModelWithLMHead.from_pretrained(output_folder)\n", "final_output_folder = f\"./models/en_{model_type}_{CHARACTER}_replics\"" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "AWJ7VKkbkJPL", "outputId": "b8c7b6ff-3022-42a2-d22c-a79f4ea676f1" }, "execution_count": 24, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "/usr/local/lib/python3.10/dist-packages/transformers/models/auto/modeling_auto.py:1595: FutureWarning: The class `AutoModelWithLMHead` is deprecated and will be removed in a future version. Please use `AutoModelForCausalLM` for causal language models, `AutoModelForMaskedLM` for masked language models and `AutoModelForSeq2SeqLM` for encoder-decoder models.\n", " warnings.warn(\n" ] } ] }, { "cell_type": "code", "source": [ "training_args = TrainingArguments(\n", " output_dir = final_output_folder,\n", " overwrite_output_dir=True, #overwrite the content of the output directory\n", " num_train_epochs=5, # number of training epochs\n", " learning_rate=0.00001, # learning rate\n", " lr_scheduler_type=\"linear\",\n", " per_device_train_batch_size=6, # batch size for training\n", " per_device_eval_batch_size=6, # batch size for evaluation\n", " eval_steps = 400, # number of update steps between two evaluations\n", " save_steps = 400, # after # steps model is saved\n", " save_strategy = \"steps\",\n", " evaluation_strategy = \"steps\",\n", " dataloader_drop_last=True, # avoid an error with an incomplete batch\n", " fp16=False,\n", " save_total_limit = 1, # Only last 5 models are saved. Older ones are deleted.\n", " load_best_model_at_end=True,\n", " )\n", "\n", "trainer = Trainer(\n", " model=model,\n", " args=training_args,\n", " data_collator=data_collator,\n", " train_dataset=train_dataset,\n", " eval_dataset=test_dataset,\n", ")" ], "metadata": { "id": "STJ1g8v-kRGD" }, "execution_count": 25, "outputs": [] }, { "cell_type": "code", "source": [ "trainer.train()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 237 }, "id": "Jig-B64qkjgC", "outputId": "6a62298c-ada3-4b2b-b97a-5bad131dcfa1" }, "execution_count": 26, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "" ], "text/html": [ "\n", "

\n", " \n", " \n", " [1990/1990 12:57, Epoch 5/5]\n", "
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
StepTraining LossValidation Loss
400No log1.924102
8001.9687001.920127
12001.7905001.930205
16001.6872001.949348

" ] }, "metadata": {} }, { "output_type": "stream", "name": "stderr", "text": [ "There were missing keys in the checkpoint model loaded: ['lm_head.weight'].\n" ] }, { "output_type": "execute_result", "data": { "text/plain": [ "TrainOutput(global_step=1990, training_loss=1.7659926218004083, metrics={'train_runtime': 776.6032, 'train_samples_per_second': 15.381, 'train_steps_per_second': 2.562, 'total_flos': 6495883296768000.0, 'train_loss': 1.7659926218004083, 'epoch': 5.0})" ] }, "metadata": {}, "execution_count": 26 } ] }, { "cell_type": "code", "source": [ "trainer.save_model()" ], "metadata": { "id": "3bYMJeMdqEZN" }, "execution_count": 27, "outputs": [] }, { "cell_type": "code", "source": [ "# The name of the task to train.\n", "TASK_NAME = f'{model_type}_mono_replics_en_{CHARACTER}'\n", "\n", "# The output directory where the fine-tuned model and checkpoints will be written.\n", "OUTPUT_DIR = f'{ROOT_DIR}/outputs/{TASK_NAME}/'\n", "pathlib.Path(OUTPUT_DIR).mkdir(parents=True, exist_ok=True)\n", "\n", "CONFIG_NAME = \"config.json\"\n", "WEIGHTS_NAME = f\"{TASK_NAME}_pytorch_model.bin\"\n", "\n", "saver(model, OUTPUT_DIR, WEIGHTS_NAME)" ], "metadata": { "id": "b2K3lFaMkntr" }, "execution_count": 28, "outputs": [] }, { "cell_type": "code", "source": [ "chef = pipeline('text-generation', model=\"./models/en_gpt2-large_rachel_replics\", tokenizer=model_type)" ], "metadata": { "id": "Wv7iMsSCntjL" }, "execution_count": 30, "outputs": [] }, { "cell_type": "code", "source": [ "tmp = chef(f\"NOTFRIEND: Do you like Ross?\\nRACHEL:\")[0]['generated_text']\n", "tmp = tmp[tmp.find(f\"RACHEL: \") + len(\"RACHEL\") + 2 : tmp.find('')]\n", "tmp" ], "metadata": { "id": "-pfVaiGQhZh0" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "source": [ "message1 = \"Hi, Rachel! How are you?\"\n", "message2 = \"Glad to hear it! Where are you going?\"" ], "metadata": { "id": "BvHVpTx9tGY2" }, "execution_count": 32, "outputs": [] }, { "cell_type": "code", "source": [ "tmp = chef(f\"NOTFRIEND: {message1}\\nRACHEL:\")[0]['generated_text']" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "QD2AcGJAXpao", "outputId": "a0055cf7-b9c0-4b59-8294-9a8b74ef4462" }, "execution_count": 44, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.\n" ] } ] }, { "cell_type": "code", "source": [ "tmp = tmp[tmp.find(f\"RACHEL: \") + len(\"RACHEL\") + 2 : tmp.find('')]\n", "tmp" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 36 }, "id": "bRa5FDNzXxZq", "outputId": "0678e5da-42c1-4ffa-cb1a-8163bab9f6eb" }, "execution_count": 45, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "'Oh, it’s not bad, it’s like, perfect. I’m sorry, I know we should be togethe'" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "string" } }, "metadata": {}, "execution_count": 45 } ] }, { "cell_type": "code", "source": [ "message1 = \"Hi, Rachel! How are you?\"\n", "text = f\"NOTFRIEND: {message1}\\nRACHEL:\"\n", "inpt = tokenizer.encode(text, return_tensors=\"pt\")" ], "metadata": { "id": "b35Ylb9_YmnS" }, "execution_count": 64, "outputs": [] }, { "cell_type": "code", "source": [ "out = model.generate(inpt.cuda(),\n", " max_length=50,\n", " repetition_penalty=5.0,\n", " do_sample=True,\n", " top_k=5,\n", " top_p=0.95,\n", " temperature=1)" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "A1920Yb1ahIt", "outputId": "1786c240-8a88-41d4-c8a2-3b74e08e8e09" }, "execution_count": 65, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "The attention mask and the pad token id were not set. As a consequence, you may observe unexpected behavior. Please pass your input's `attention_mask` to obtain reliable results.\n", "Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.\n" ] } ] }, { "cell_type": "code", "source": [ "generated_text = tokenizer.decode(out[0])\n", "generated_text = generated_text[generated_text.find(f\"RACHEL: \") + len(\"RACHEL\") + 2 : generated_text.find('')]" ], "metadata": { "id": "nic2z2A3a1FP" }, "execution_count": 67, "outputs": [] }, { "cell_type": "code", "source": [ "log_msg = \"Model generates reply {} for {}\".format(generated_text, message1)\n", "log_msg" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 36 }, "id": "70xEEO6pbXwA", "outputId": "ec688f61-4531-4570-891b-73417936b31c" }, "execution_count": 68, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "\"Model generates reply Oh God. I'm good. for Hi, Rachel! How are you?\"" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "string" } }, "metadata": {}, "execution_count": 68 } ] } ] }