joshcarp commited on
Commit
c00d619
1 Parent(s): c95869e

Upload gpt2_evy.ipynb

Browse files
Files changed (1) hide show
  1. gpt2_evy.ipynb +2257 -0
gpt2_evy.ipynb ADDED
@@ -0,0 +1,2257 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "nbformat": 4,
3
+ "nbformat_minor": 0,
4
+ "metadata": {
5
+ "colab": {
6
+ "provenance": [],
7
+ "gpuType": "A100",
8
+ "machine_shape": "hm"
9
+ },
10
+ "kernelspec": {
11
+ "name": "python3",
12
+ "display_name": "Python 3"
13
+ },
14
+ "language_info": {
15
+ "name": "python"
16
+ },
17
+ "accelerator": "GPU",
18
+ "widgets": {
19
+ "application/vnd.jupyter.widget-state+json": {
20
+ "a268227e95cc46cda6c40f88f76729b4": {
21
+ "model_module": "@jupyter-widgets/controls",
22
+ "model_name": "VBoxModel",
23
+ "model_module_version": "1.5.0",
24
+ "state": {
25
+ "_dom_classes": [],
26
+ "_model_module": "@jupyter-widgets/controls",
27
+ "_model_module_version": "1.5.0",
28
+ "_model_name": "VBoxModel",
29
+ "_view_count": null,
30
+ "_view_module": "@jupyter-widgets/controls",
31
+ "_view_module_version": "1.5.0",
32
+ "_view_name": "VBoxView",
33
+ "box_style": "",
34
+ "children": [
35
+ "IPY_MODEL_8d2fc30851ab4972a0fc9763f81ed088",
36
+ "IPY_MODEL_6c9471e6455a4245a9fa731ef480041d",
37
+ "IPY_MODEL_e04732f9aee643378919f97ceed29a79",
38
+ "IPY_MODEL_865a67dd6e0c4b779a6bb41a8bd06882"
39
+ ],
40
+ "layout": "IPY_MODEL_c3b6d6efc0bb4cebb43e54f1cac15398"
41
+ }
42
+ },
43
+ "5d2b151866db434b9a97054136972c02": {
44
+ "model_module": "@jupyter-widgets/controls",
45
+ "model_name": "HTMLModel",
46
+ "model_module_version": "1.5.0",
47
+ "state": {
48
+ "_dom_classes": [],
49
+ "_model_module": "@jupyter-widgets/controls",
50
+ "_model_module_version": "1.5.0",
51
+ "_model_name": "HTMLModel",
52
+ "_view_count": null,
53
+ "_view_module": "@jupyter-widgets/controls",
54
+ "_view_module_version": "1.5.0",
55
+ "_view_name": "HTMLView",
56
+ "description": "",
57
+ "description_tooltip": null,
58
+ "layout": "IPY_MODEL_dfb07bd69a98467385a922d93dbbdf78",
59
+ "placeholder": "​",
60
+ "style": "IPY_MODEL_b8c97b05b8cd41929982d3dfa4c0253e",
61
+ "value": "<center> <img\nsrc=https://huggingface.co/front/assets/huggingface_logo-noborder.svg\nalt='Hugging Face'> <br> Copy a token from <a\nhref=\"https://huggingface.co/settings/tokens\" target=\"_blank\">your Hugging Face\ntokens page</a> and paste it below. <br> Immediately click login after copying\nyour token or it might be stored in plain text in this notebook file. </center>"
62
+ }
63
+ },
64
+ "26e2d737d2334bfaab84d7567957f98f": {
65
+ "model_module": "@jupyter-widgets/controls",
66
+ "model_name": "PasswordModel",
67
+ "model_module_version": "1.5.0",
68
+ "state": {
69
+ "_dom_classes": [],
70
+ "_model_module": "@jupyter-widgets/controls",
71
+ "_model_module_version": "1.5.0",
72
+ "_model_name": "PasswordModel",
73
+ "_view_count": null,
74
+ "_view_module": "@jupyter-widgets/controls",
75
+ "_view_module_version": "1.5.0",
76
+ "_view_name": "PasswordView",
77
+ "continuous_update": true,
78
+ "description": "Token:",
79
+ "description_tooltip": null,
80
+ "disabled": false,
81
+ "layout": "IPY_MODEL_c14e7006466f465495524c631cb47296",
82
+ "placeholder": "​",
83
+ "style": "IPY_MODEL_49eef402a9aa41c09b515ccd03b1ded4",
84
+ "value": ""
85
+ }
86
+ },
87
+ "f65f24dbbc8e43ddb98f786c70412088": {
88
+ "model_module": "@jupyter-widgets/controls",
89
+ "model_name": "CheckboxModel",
90
+ "model_module_version": "1.5.0",
91
+ "state": {
92
+ "_dom_classes": [],
93
+ "_model_module": "@jupyter-widgets/controls",
94
+ "_model_module_version": "1.5.0",
95
+ "_model_name": "CheckboxModel",
96
+ "_view_count": null,
97
+ "_view_module": "@jupyter-widgets/controls",
98
+ "_view_module_version": "1.5.0",
99
+ "_view_name": "CheckboxView",
100
+ "description": "Add token as git credential?",
101
+ "description_tooltip": null,
102
+ "disabled": false,
103
+ "indent": true,
104
+ "layout": "IPY_MODEL_3af71b9541134fe9a62c1c3fe594062b",
105
+ "style": "IPY_MODEL_aebc8baf9fc442bb86a849886c94eebd",
106
+ "value": true
107
+ }
108
+ },
109
+ "92abf62190e543a8bcf5cd497fb0594e": {
110
+ "model_module": "@jupyter-widgets/controls",
111
+ "model_name": "ButtonModel",
112
+ "model_module_version": "1.5.0",
113
+ "state": {
114
+ "_dom_classes": [],
115
+ "_model_module": "@jupyter-widgets/controls",
116
+ "_model_module_version": "1.5.0",
117
+ "_model_name": "ButtonModel",
118
+ "_view_count": null,
119
+ "_view_module": "@jupyter-widgets/controls",
120
+ "_view_module_version": "1.5.0",
121
+ "_view_name": "ButtonView",
122
+ "button_style": "",
123
+ "description": "Login",
124
+ "disabled": false,
125
+ "icon": "",
126
+ "layout": "IPY_MODEL_16c2e8011f0f45808960ab2b8bd53443",
127
+ "style": "IPY_MODEL_7bb44167e92e4d73ac5ea1ced3d08110",
128
+ "tooltip": ""
129
+ }
130
+ },
131
+ "3d9f52d2c3294ca4a83d91987387ff8c": {
132
+ "model_module": "@jupyter-widgets/controls",
133
+ "model_name": "HTMLModel",
134
+ "model_module_version": "1.5.0",
135
+ "state": {
136
+ "_dom_classes": [],
137
+ "_model_module": "@jupyter-widgets/controls",
138
+ "_model_module_version": "1.5.0",
139
+ "_model_name": "HTMLModel",
140
+ "_view_count": null,
141
+ "_view_module": "@jupyter-widgets/controls",
142
+ "_view_module_version": "1.5.0",
143
+ "_view_name": "HTMLView",
144
+ "description": "",
145
+ "description_tooltip": null,
146
+ "layout": "IPY_MODEL_ebefb66192ce436cb6bdc2f6e889479c",
147
+ "placeholder": "​",
148
+ "style": "IPY_MODEL_ce227eacf424429899de05839c6a09b4",
149
+ "value": "\n<b>Pro Tip:</b> If you don't already have one, you can create a dedicated\n'notebooks' token with 'write' access, that you can then easily reuse for all\nnotebooks. </center>"
150
+ }
151
+ },
152
+ "c3b6d6efc0bb4cebb43e54f1cac15398": {
153
+ "model_module": "@jupyter-widgets/base",
154
+ "model_name": "LayoutModel",
155
+ "model_module_version": "1.2.0",
156
+ "state": {
157
+ "_model_module": "@jupyter-widgets/base",
158
+ "_model_module_version": "1.2.0",
159
+ "_model_name": "LayoutModel",
160
+ "_view_count": null,
161
+ "_view_module": "@jupyter-widgets/base",
162
+ "_view_module_version": "1.2.0",
163
+ "_view_name": "LayoutView",
164
+ "align_content": null,
165
+ "align_items": "center",
166
+ "align_self": null,
167
+ "border": null,
168
+ "bottom": null,
169
+ "display": "flex",
170
+ "flex": null,
171
+ "flex_flow": "column",
172
+ "grid_area": null,
173
+ "grid_auto_columns": null,
174
+ "grid_auto_flow": null,
175
+ "grid_auto_rows": null,
176
+ "grid_column": null,
177
+ "grid_gap": null,
178
+ "grid_row": null,
179
+ "grid_template_areas": null,
180
+ "grid_template_columns": null,
181
+ "grid_template_rows": null,
182
+ "height": null,
183
+ "justify_content": null,
184
+ "justify_items": null,
185
+ "left": null,
186
+ "margin": null,
187
+ "max_height": null,
188
+ "max_width": null,
189
+ "min_height": null,
190
+ "min_width": null,
191
+ "object_fit": null,
192
+ "object_position": null,
193
+ "order": null,
194
+ "overflow": null,
195
+ "overflow_x": null,
196
+ "overflow_y": null,
197
+ "padding": null,
198
+ "right": null,
199
+ "top": null,
200
+ "visibility": null,
201
+ "width": "50%"
202
+ }
203
+ },
204
+ "dfb07bd69a98467385a922d93dbbdf78": {
205
+ "model_module": "@jupyter-widgets/base",
206
+ "model_name": "LayoutModel",
207
+ "model_module_version": "1.2.0",
208
+ "state": {
209
+ "_model_module": "@jupyter-widgets/base",
210
+ "_model_module_version": "1.2.0",
211
+ "_model_name": "LayoutModel",
212
+ "_view_count": null,
213
+ "_view_module": "@jupyter-widgets/base",
214
+ "_view_module_version": "1.2.0",
215
+ "_view_name": "LayoutView",
216
+ "align_content": null,
217
+ "align_items": null,
218
+ "align_self": null,
219
+ "border": null,
220
+ "bottom": null,
221
+ "display": null,
222
+ "flex": null,
223
+ "flex_flow": null,
224
+ "grid_area": null,
225
+ "grid_auto_columns": null,
226
+ "grid_auto_flow": null,
227
+ "grid_auto_rows": null,
228
+ "grid_column": null,
229
+ "grid_gap": null,
230
+ "grid_row": null,
231
+ "grid_template_areas": null,
232
+ "grid_template_columns": null,
233
+ "grid_template_rows": null,
234
+ "height": null,
235
+ "justify_content": null,
236
+ "justify_items": null,
237
+ "left": null,
238
+ "margin": null,
239
+ "max_height": null,
240
+ "max_width": null,
241
+ "min_height": null,
242
+ "min_width": null,
243
+ "object_fit": null,
244
+ "object_position": null,
245
+ "order": null,
246
+ "overflow": null,
247
+ "overflow_x": null,
248
+ "overflow_y": null,
249
+ "padding": null,
250
+ "right": null,
251
+ "top": null,
252
+ "visibility": null,
253
+ "width": null
254
+ }
255
+ },
256
+ "b8c97b05b8cd41929982d3dfa4c0253e": {
257
+ "model_module": "@jupyter-widgets/controls",
258
+ "model_name": "DescriptionStyleModel",
259
+ "model_module_version": "1.5.0",
260
+ "state": {
261
+ "_model_module": "@jupyter-widgets/controls",
262
+ "_model_module_version": "1.5.0",
263
+ "_model_name": "DescriptionStyleModel",
264
+ "_view_count": null,
265
+ "_view_module": "@jupyter-widgets/base",
266
+ "_view_module_version": "1.2.0",
267
+ "_view_name": "StyleView",
268
+ "description_width": ""
269
+ }
270
+ },
271
+ "c14e7006466f465495524c631cb47296": {
272
+ "model_module": "@jupyter-widgets/base",
273
+ "model_name": "LayoutModel",
274
+ "model_module_version": "1.2.0",
275
+ "state": {
276
+ "_model_module": "@jupyter-widgets/base",
277
+ "_model_module_version": "1.2.0",
278
+ "_model_name": "LayoutModel",
279
+ "_view_count": null,
280
+ "_view_module": "@jupyter-widgets/base",
281
+ "_view_module_version": "1.2.0",
282
+ "_view_name": "LayoutView",
283
+ "align_content": null,
284
+ "align_items": null,
285
+ "align_self": null,
286
+ "border": null,
287
+ "bottom": null,
288
+ "display": null,
289
+ "flex": null,
290
+ "flex_flow": null,
291
+ "grid_area": null,
292
+ "grid_auto_columns": null,
293
+ "grid_auto_flow": null,
294
+ "grid_auto_rows": null,
295
+ "grid_column": null,
296
+ "grid_gap": null,
297
+ "grid_row": null,
298
+ "grid_template_areas": null,
299
+ "grid_template_columns": null,
300
+ "grid_template_rows": null,
301
+ "height": null,
302
+ "justify_content": null,
303
+ "justify_items": null,
304
+ "left": null,
305
+ "margin": null,
306
+ "max_height": null,
307
+ "max_width": null,
308
+ "min_height": null,
309
+ "min_width": null,
310
+ "object_fit": null,
311
+ "object_position": null,
312
+ "order": null,
313
+ "overflow": null,
314
+ "overflow_x": null,
315
+ "overflow_y": null,
316
+ "padding": null,
317
+ "right": null,
318
+ "top": null,
319
+ "visibility": null,
320
+ "width": null
321
+ }
322
+ },
323
+ "49eef402a9aa41c09b515ccd03b1ded4": {
324
+ "model_module": "@jupyter-widgets/controls",
325
+ "model_name": "DescriptionStyleModel",
326
+ "model_module_version": "1.5.0",
327
+ "state": {
328
+ "_model_module": "@jupyter-widgets/controls",
329
+ "_model_module_version": "1.5.0",
330
+ "_model_name": "DescriptionStyleModel",
331
+ "_view_count": null,
332
+ "_view_module": "@jupyter-widgets/base",
333
+ "_view_module_version": "1.2.0",
334
+ "_view_name": "StyleView",
335
+ "description_width": ""
336
+ }
337
+ },
338
+ "3af71b9541134fe9a62c1c3fe594062b": {
339
+ "model_module": "@jupyter-widgets/base",
340
+ "model_name": "LayoutModel",
341
+ "model_module_version": "1.2.0",
342
+ "state": {
343
+ "_model_module": "@jupyter-widgets/base",
344
+ "_model_module_version": "1.2.0",
345
+ "_model_name": "LayoutModel",
346
+ "_view_count": null,
347
+ "_view_module": "@jupyter-widgets/base",
348
+ "_view_module_version": "1.2.0",
349
+ "_view_name": "LayoutView",
350
+ "align_content": null,
351
+ "align_items": null,
352
+ "align_self": null,
353
+ "border": null,
354
+ "bottom": null,
355
+ "display": null,
356
+ "flex": null,
357
+ "flex_flow": null,
358
+ "grid_area": null,
359
+ "grid_auto_columns": null,
360
+ "grid_auto_flow": null,
361
+ "grid_auto_rows": null,
362
+ "grid_column": null,
363
+ "grid_gap": null,
364
+ "grid_row": null,
365
+ "grid_template_areas": null,
366
+ "grid_template_columns": null,
367
+ "grid_template_rows": null,
368
+ "height": null,
369
+ "justify_content": null,
370
+ "justify_items": null,
371
+ "left": null,
372
+ "margin": null,
373
+ "max_height": null,
374
+ "max_width": null,
375
+ "min_height": null,
376
+ "min_width": null,
377
+ "object_fit": null,
378
+ "object_position": null,
379
+ "order": null,
380
+ "overflow": null,
381
+ "overflow_x": null,
382
+ "overflow_y": null,
383
+ "padding": null,
384
+ "right": null,
385
+ "top": null,
386
+ "visibility": null,
387
+ "width": null
388
+ }
389
+ },
390
+ "aebc8baf9fc442bb86a849886c94eebd": {
391
+ "model_module": "@jupyter-widgets/controls",
392
+ "model_name": "DescriptionStyleModel",
393
+ "model_module_version": "1.5.0",
394
+ "state": {
395
+ "_model_module": "@jupyter-widgets/controls",
396
+ "_model_module_version": "1.5.0",
397
+ "_model_name": "DescriptionStyleModel",
398
+ "_view_count": null,
399
+ "_view_module": "@jupyter-widgets/base",
400
+ "_view_module_version": "1.2.0",
401
+ "_view_name": "StyleView",
402
+ "description_width": ""
403
+ }
404
+ },
405
+ "16c2e8011f0f45808960ab2b8bd53443": {
406
+ "model_module": "@jupyter-widgets/base",
407
+ "model_name": "LayoutModel",
408
+ "model_module_version": "1.2.0",
409
+ "state": {
410
+ "_model_module": "@jupyter-widgets/base",
411
+ "_model_module_version": "1.2.0",
412
+ "_model_name": "LayoutModel",
413
+ "_view_count": null,
414
+ "_view_module": "@jupyter-widgets/base",
415
+ "_view_module_version": "1.2.0",
416
+ "_view_name": "LayoutView",
417
+ "align_content": null,
418
+ "align_items": null,
419
+ "align_self": null,
420
+ "border": null,
421
+ "bottom": null,
422
+ "display": null,
423
+ "flex": null,
424
+ "flex_flow": null,
425
+ "grid_area": null,
426
+ "grid_auto_columns": null,
427
+ "grid_auto_flow": null,
428
+ "grid_auto_rows": null,
429
+ "grid_column": null,
430
+ "grid_gap": null,
431
+ "grid_row": null,
432
+ "grid_template_areas": null,
433
+ "grid_template_columns": null,
434
+ "grid_template_rows": null,
435
+ "height": null,
436
+ "justify_content": null,
437
+ "justify_items": null,
438
+ "left": null,
439
+ "margin": null,
440
+ "max_height": null,
441
+ "max_width": null,
442
+ "min_height": null,
443
+ "min_width": null,
444
+ "object_fit": null,
445
+ "object_position": null,
446
+ "order": null,
447
+ "overflow": null,
448
+ "overflow_x": null,
449
+ "overflow_y": null,
450
+ "padding": null,
451
+ "right": null,
452
+ "top": null,
453
+ "visibility": null,
454
+ "width": null
455
+ }
456
+ },
457
+ "7bb44167e92e4d73ac5ea1ced3d08110": {
458
+ "model_module": "@jupyter-widgets/controls",
459
+ "model_name": "ButtonStyleModel",
460
+ "model_module_version": "1.5.0",
461
+ "state": {
462
+ "_model_module": "@jupyter-widgets/controls",
463
+ "_model_module_version": "1.5.0",
464
+ "_model_name": "ButtonStyleModel",
465
+ "_view_count": null,
466
+ "_view_module": "@jupyter-widgets/base",
467
+ "_view_module_version": "1.2.0",
468
+ "_view_name": "StyleView",
469
+ "button_color": null,
470
+ "font_weight": ""
471
+ }
472
+ },
473
+ "ebefb66192ce436cb6bdc2f6e889479c": {
474
+ "model_module": "@jupyter-widgets/base",
475
+ "model_name": "LayoutModel",
476
+ "model_module_version": "1.2.0",
477
+ "state": {
478
+ "_model_module": "@jupyter-widgets/base",
479
+ "_model_module_version": "1.2.0",
480
+ "_model_name": "LayoutModel",
481
+ "_view_count": null,
482
+ "_view_module": "@jupyter-widgets/base",
483
+ "_view_module_version": "1.2.0",
484
+ "_view_name": "LayoutView",
485
+ "align_content": null,
486
+ "align_items": null,
487
+ "align_self": null,
488
+ "border": null,
489
+ "bottom": null,
490
+ "display": null,
491
+ "flex": null,
492
+ "flex_flow": null,
493
+ "grid_area": null,
494
+ "grid_auto_columns": null,
495
+ "grid_auto_flow": null,
496
+ "grid_auto_rows": null,
497
+ "grid_column": null,
498
+ "grid_gap": null,
499
+ "grid_row": null,
500
+ "grid_template_areas": null,
501
+ "grid_template_columns": null,
502
+ "grid_template_rows": null,
503
+ "height": null,
504
+ "justify_content": null,
505
+ "justify_items": null,
506
+ "left": null,
507
+ "margin": null,
508
+ "max_height": null,
509
+ "max_width": null,
510
+ "min_height": null,
511
+ "min_width": null,
512
+ "object_fit": null,
513
+ "object_position": null,
514
+ "order": null,
515
+ "overflow": null,
516
+ "overflow_x": null,
517
+ "overflow_y": null,
518
+ "padding": null,
519
+ "right": null,
520
+ "top": null,
521
+ "visibility": null,
522
+ "width": null
523
+ }
524
+ },
525
+ "ce227eacf424429899de05839c6a09b4": {
526
+ "model_module": "@jupyter-widgets/controls",
527
+ "model_name": "DescriptionStyleModel",
528
+ "model_module_version": "1.5.0",
529
+ "state": {
530
+ "_model_module": "@jupyter-widgets/controls",
531
+ "_model_module_version": "1.5.0",
532
+ "_model_name": "DescriptionStyleModel",
533
+ "_view_count": null,
534
+ "_view_module": "@jupyter-widgets/base",
535
+ "_view_module_version": "1.2.0",
536
+ "_view_name": "StyleView",
537
+ "description_width": ""
538
+ }
539
+ },
540
+ "f453dda624134aaeb5aaa68280b16a14": {
541
+ "model_module": "@jupyter-widgets/controls",
542
+ "model_name": "LabelModel",
543
+ "model_module_version": "1.5.0",
544
+ "state": {
545
+ "_dom_classes": [],
546
+ "_model_module": "@jupyter-widgets/controls",
547
+ "_model_module_version": "1.5.0",
548
+ "_model_name": "LabelModel",
549
+ "_view_count": null,
550
+ "_view_module": "@jupyter-widgets/controls",
551
+ "_view_module_version": "1.5.0",
552
+ "_view_name": "LabelView",
553
+ "description": "",
554
+ "description_tooltip": null,
555
+ "layout": "IPY_MODEL_08187be630cf4f3c914cabcc2aec20dd",
556
+ "placeholder": "​",
557
+ "style": "IPY_MODEL_06ca0c50c53c4d4da485ff88bf94299b",
558
+ "value": "Connecting..."
559
+ }
560
+ },
561
+ "08187be630cf4f3c914cabcc2aec20dd": {
562
+ "model_module": "@jupyter-widgets/base",
563
+ "model_name": "LayoutModel",
564
+ "model_module_version": "1.2.0",
565
+ "state": {
566
+ "_model_module": "@jupyter-widgets/base",
567
+ "_model_module_version": "1.2.0",
568
+ "_model_name": "LayoutModel",
569
+ "_view_count": null,
570
+ "_view_module": "@jupyter-widgets/base",
571
+ "_view_module_version": "1.2.0",
572
+ "_view_name": "LayoutView",
573
+ "align_content": null,
574
+ "align_items": null,
575
+ "align_self": null,
576
+ "border": null,
577
+ "bottom": null,
578
+ "display": null,
579
+ "flex": null,
580
+ "flex_flow": null,
581
+ "grid_area": null,
582
+ "grid_auto_columns": null,
583
+ "grid_auto_flow": null,
584
+ "grid_auto_rows": null,
585
+ "grid_column": null,
586
+ "grid_gap": null,
587
+ "grid_row": null,
588
+ "grid_template_areas": null,
589
+ "grid_template_columns": null,
590
+ "grid_template_rows": null,
591
+ "height": null,
592
+ "justify_content": null,
593
+ "justify_items": null,
594
+ "left": null,
595
+ "margin": null,
596
+ "max_height": null,
597
+ "max_width": null,
598
+ "min_height": null,
599
+ "min_width": null,
600
+ "object_fit": null,
601
+ "object_position": null,
602
+ "order": null,
603
+ "overflow": null,
604
+ "overflow_x": null,
605
+ "overflow_y": null,
606
+ "padding": null,
607
+ "right": null,
608
+ "top": null,
609
+ "visibility": null,
610
+ "width": null
611
+ }
612
+ },
613
+ "06ca0c50c53c4d4da485ff88bf94299b": {
614
+ "model_module": "@jupyter-widgets/controls",
615
+ "model_name": "DescriptionStyleModel",
616
+ "model_module_version": "1.5.0",
617
+ "state": {
618
+ "_model_module": "@jupyter-widgets/controls",
619
+ "_model_module_version": "1.5.0",
620
+ "_model_name": "DescriptionStyleModel",
621
+ "_view_count": null,
622
+ "_view_module": "@jupyter-widgets/base",
623
+ "_view_module_version": "1.2.0",
624
+ "_view_name": "StyleView",
625
+ "description_width": ""
626
+ }
627
+ },
628
+ "8d2fc30851ab4972a0fc9763f81ed088": {
629
+ "model_module": "@jupyter-widgets/controls",
630
+ "model_name": "LabelModel",
631
+ "model_module_version": "1.5.0",
632
+ "state": {
633
+ "_dom_classes": [],
634
+ "_model_module": "@jupyter-widgets/controls",
635
+ "_model_module_version": "1.5.0",
636
+ "_model_name": "LabelModel",
637
+ "_view_count": null,
638
+ "_view_module": "@jupyter-widgets/controls",
639
+ "_view_module_version": "1.5.0",
640
+ "_view_name": "LabelView",
641
+ "description": "",
642
+ "description_tooltip": null,
643
+ "layout": "IPY_MODEL_143ec709013d414d833cbd3ed2a0f74f",
644
+ "placeholder": "​",
645
+ "style": "IPY_MODEL_f4d5c9d24b5a493ea78664e94ea25515",
646
+ "value": "Token is valid (permission: write)."
647
+ }
648
+ },
649
+ "6c9471e6455a4245a9fa731ef480041d": {
650
+ "model_module": "@jupyter-widgets/controls",
651
+ "model_name": "LabelModel",
652
+ "model_module_version": "1.5.0",
653
+ "state": {
654
+ "_dom_classes": [],
655
+ "_model_module": "@jupyter-widgets/controls",
656
+ "_model_module_version": "1.5.0",
657
+ "_model_name": "LabelModel",
658
+ "_view_count": null,
659
+ "_view_module": "@jupyter-widgets/controls",
660
+ "_view_module_version": "1.5.0",
661
+ "_view_name": "LabelView",
662
+ "description": "",
663
+ "description_tooltip": null,
664
+ "layout": "IPY_MODEL_afb3c41f45414f52baa9f9a9f7c7736b",
665
+ "placeholder": "​",
666
+ "style": "IPY_MODEL_7fe879a2a8f44482871464fb054c1afb",
667
+ "value": "Your token has been saved in your configured git credential helpers (store)."
668
+ }
669
+ },
670
+ "e04732f9aee643378919f97ceed29a79": {
671
+ "model_module": "@jupyter-widgets/controls",
672
+ "model_name": "LabelModel",
673
+ "model_module_version": "1.5.0",
674
+ "state": {
675
+ "_dom_classes": [],
676
+ "_model_module": "@jupyter-widgets/controls",
677
+ "_model_module_version": "1.5.0",
678
+ "_model_name": "LabelModel",
679
+ "_view_count": null,
680
+ "_view_module": "@jupyter-widgets/controls",
681
+ "_view_module_version": "1.5.0",
682
+ "_view_name": "LabelView",
683
+ "description": "",
684
+ "description_tooltip": null,
685
+ "layout": "IPY_MODEL_4d240fcf5631432fb0ee8341f71856ac",
686
+ "placeholder": "​",
687
+ "style": "IPY_MODEL_94433bd4dd0c4eb0bc111e6528581bea",
688
+ "value": "Your token has been saved to /root/.cache/huggingface/token"
689
+ }
690
+ },
691
+ "865a67dd6e0c4b779a6bb41a8bd06882": {
692
+ "model_module": "@jupyter-widgets/controls",
693
+ "model_name": "LabelModel",
694
+ "model_module_version": "1.5.0",
695
+ "state": {
696
+ "_dom_classes": [],
697
+ "_model_module": "@jupyter-widgets/controls",
698
+ "_model_module_version": "1.5.0",
699
+ "_model_name": "LabelModel",
700
+ "_view_count": null,
701
+ "_view_module": "@jupyter-widgets/controls",
702
+ "_view_module_version": "1.5.0",
703
+ "_view_name": "LabelView",
704
+ "description": "",
705
+ "description_tooltip": null,
706
+ "layout": "IPY_MODEL_c39370639cdd41d18156303bc54f21f7",
707
+ "placeholder": "​",
708
+ "style": "IPY_MODEL_eee463d63f2d4c489f09a501ce5c387e",
709
+ "value": "Login successful"
710
+ }
711
+ },
712
+ "143ec709013d414d833cbd3ed2a0f74f": {
713
+ "model_module": "@jupyter-widgets/base",
714
+ "model_name": "LayoutModel",
715
+ "model_module_version": "1.2.0",
716
+ "state": {
717
+ "_model_module": "@jupyter-widgets/base",
718
+ "_model_module_version": "1.2.0",
719
+ "_model_name": "LayoutModel",
720
+ "_view_count": null,
721
+ "_view_module": "@jupyter-widgets/base",
722
+ "_view_module_version": "1.2.0",
723
+ "_view_name": "LayoutView",
724
+ "align_content": null,
725
+ "align_items": null,
726
+ "align_self": null,
727
+ "border": null,
728
+ "bottom": null,
729
+ "display": null,
730
+ "flex": null,
731
+ "flex_flow": null,
732
+ "grid_area": null,
733
+ "grid_auto_columns": null,
734
+ "grid_auto_flow": null,
735
+ "grid_auto_rows": null,
736
+ "grid_column": null,
737
+ "grid_gap": null,
738
+ "grid_row": null,
739
+ "grid_template_areas": null,
740
+ "grid_template_columns": null,
741
+ "grid_template_rows": null,
742
+ "height": null,
743
+ "justify_content": null,
744
+ "justify_items": null,
745
+ "left": null,
746
+ "margin": null,
747
+ "max_height": null,
748
+ "max_width": null,
749
+ "min_height": null,
750
+ "min_width": null,
751
+ "object_fit": null,
752
+ "object_position": null,
753
+ "order": null,
754
+ "overflow": null,
755
+ "overflow_x": null,
756
+ "overflow_y": null,
757
+ "padding": null,
758
+ "right": null,
759
+ "top": null,
760
+ "visibility": null,
761
+ "width": null
762
+ }
763
+ },
764
+ "f4d5c9d24b5a493ea78664e94ea25515": {
765
+ "model_module": "@jupyter-widgets/controls",
766
+ "model_name": "DescriptionStyleModel",
767
+ "model_module_version": "1.5.0",
768
+ "state": {
769
+ "_model_module": "@jupyter-widgets/controls",
770
+ "_model_module_version": "1.5.0",
771
+ "_model_name": "DescriptionStyleModel",
772
+ "_view_count": null,
773
+ "_view_module": "@jupyter-widgets/base",
774
+ "_view_module_version": "1.2.0",
775
+ "_view_name": "StyleView",
776
+ "description_width": ""
777
+ }
778
+ },
779
+ "afb3c41f45414f52baa9f9a9f7c7736b": {
780
+ "model_module": "@jupyter-widgets/base",
781
+ "model_name": "LayoutModel",
782
+ "model_module_version": "1.2.0",
783
+ "state": {
784
+ "_model_module": "@jupyter-widgets/base",
785
+ "_model_module_version": "1.2.0",
786
+ "_model_name": "LayoutModel",
787
+ "_view_count": null,
788
+ "_view_module": "@jupyter-widgets/base",
789
+ "_view_module_version": "1.2.0",
790
+ "_view_name": "LayoutView",
791
+ "align_content": null,
792
+ "align_items": null,
793
+ "align_self": null,
794
+ "border": null,
795
+ "bottom": null,
796
+ "display": null,
797
+ "flex": null,
798
+ "flex_flow": null,
799
+ "grid_area": null,
800
+ "grid_auto_columns": null,
801
+ "grid_auto_flow": null,
802
+ "grid_auto_rows": null,
803
+ "grid_column": null,
804
+ "grid_gap": null,
805
+ "grid_row": null,
806
+ "grid_template_areas": null,
807
+ "grid_template_columns": null,
808
+ "grid_template_rows": null,
809
+ "height": null,
810
+ "justify_content": null,
811
+ "justify_items": null,
812
+ "left": null,
813
+ "margin": null,
814
+ "max_height": null,
815
+ "max_width": null,
816
+ "min_height": null,
817
+ "min_width": null,
818
+ "object_fit": null,
819
+ "object_position": null,
820
+ "order": null,
821
+ "overflow": null,
822
+ "overflow_x": null,
823
+ "overflow_y": null,
824
+ "padding": null,
825
+ "right": null,
826
+ "top": null,
827
+ "visibility": null,
828
+ "width": null
829
+ }
830
+ },
831
+ "7fe879a2a8f44482871464fb054c1afb": {
832
+ "model_module": "@jupyter-widgets/controls",
833
+ "model_name": "DescriptionStyleModel",
834
+ "model_module_version": "1.5.0",
835
+ "state": {
836
+ "_model_module": "@jupyter-widgets/controls",
837
+ "_model_module_version": "1.5.0",
838
+ "_model_name": "DescriptionStyleModel",
839
+ "_view_count": null,
840
+ "_view_module": "@jupyter-widgets/base",
841
+ "_view_module_version": "1.2.0",
842
+ "_view_name": "StyleView",
843
+ "description_width": ""
844
+ }
845
+ },
846
+ "4d240fcf5631432fb0ee8341f71856ac": {
847
+ "model_module": "@jupyter-widgets/base",
848
+ "model_name": "LayoutModel",
849
+ "model_module_version": "1.2.0",
850
+ "state": {
851
+ "_model_module": "@jupyter-widgets/base",
852
+ "_model_module_version": "1.2.0",
853
+ "_model_name": "LayoutModel",
854
+ "_view_count": null,
855
+ "_view_module": "@jupyter-widgets/base",
856
+ "_view_module_version": "1.2.0",
857
+ "_view_name": "LayoutView",
858
+ "align_content": null,
859
+ "align_items": null,
860
+ "align_self": null,
861
+ "border": null,
862
+ "bottom": null,
863
+ "display": null,
864
+ "flex": null,
865
+ "flex_flow": null,
866
+ "grid_area": null,
867
+ "grid_auto_columns": null,
868
+ "grid_auto_flow": null,
869
+ "grid_auto_rows": null,
870
+ "grid_column": null,
871
+ "grid_gap": null,
872
+ "grid_row": null,
873
+ "grid_template_areas": null,
874
+ "grid_template_columns": null,
875
+ "grid_template_rows": null,
876
+ "height": null,
877
+ "justify_content": null,
878
+ "justify_items": null,
879
+ "left": null,
880
+ "margin": null,
881
+ "max_height": null,
882
+ "max_width": null,
883
+ "min_height": null,
884
+ "min_width": null,
885
+ "object_fit": null,
886
+ "object_position": null,
887
+ "order": null,
888
+ "overflow": null,
889
+ "overflow_x": null,
890
+ "overflow_y": null,
891
+ "padding": null,
892
+ "right": null,
893
+ "top": null,
894
+ "visibility": null,
895
+ "width": null
896
+ }
897
+ },
898
+ "94433bd4dd0c4eb0bc111e6528581bea": {
899
+ "model_module": "@jupyter-widgets/controls",
900
+ "model_name": "DescriptionStyleModel",
901
+ "model_module_version": "1.5.0",
902
+ "state": {
903
+ "_model_module": "@jupyter-widgets/controls",
904
+ "_model_module_version": "1.5.0",
905
+ "_model_name": "DescriptionStyleModel",
906
+ "_view_count": null,
907
+ "_view_module": "@jupyter-widgets/base",
908
+ "_view_module_version": "1.2.0",
909
+ "_view_name": "StyleView",
910
+ "description_width": ""
911
+ }
912
+ },
913
+ "c39370639cdd41d18156303bc54f21f7": {
914
+ "model_module": "@jupyter-widgets/base",
915
+ "model_name": "LayoutModel",
916
+ "model_module_version": "1.2.0",
917
+ "state": {
918
+ "_model_module": "@jupyter-widgets/base",
919
+ "_model_module_version": "1.2.0",
920
+ "_model_name": "LayoutModel",
921
+ "_view_count": null,
922
+ "_view_module": "@jupyter-widgets/base",
923
+ "_view_module_version": "1.2.0",
924
+ "_view_name": "LayoutView",
925
+ "align_content": null,
926
+ "align_items": null,
927
+ "align_self": null,
928
+ "border": null,
929
+ "bottom": null,
930
+ "display": null,
931
+ "flex": null,
932
+ "flex_flow": null,
933
+ "grid_area": null,
934
+ "grid_auto_columns": null,
935
+ "grid_auto_flow": null,
936
+ "grid_auto_rows": null,
937
+ "grid_column": null,
938
+ "grid_gap": null,
939
+ "grid_row": null,
940
+ "grid_template_areas": null,
941
+ "grid_template_columns": null,
942
+ "grid_template_rows": null,
943
+ "height": null,
944
+ "justify_content": null,
945
+ "justify_items": null,
946
+ "left": null,
947
+ "margin": null,
948
+ "max_height": null,
949
+ "max_width": null,
950
+ "min_height": null,
951
+ "min_width": null,
952
+ "object_fit": null,
953
+ "object_position": null,
954
+ "order": null,
955
+ "overflow": null,
956
+ "overflow_x": null,
957
+ "overflow_y": null,
958
+ "padding": null,
959
+ "right": null,
960
+ "top": null,
961
+ "visibility": null,
962
+ "width": null
963
+ }
964
+ },
965
+ "eee463d63f2d4c489f09a501ce5c387e": {
966
+ "model_module": "@jupyter-widgets/controls",
967
+ "model_name": "DescriptionStyleModel",
968
+ "model_module_version": "1.5.0",
969
+ "state": {
970
+ "_model_module": "@jupyter-widgets/controls",
971
+ "_model_module_version": "1.5.0",
972
+ "_model_name": "DescriptionStyleModel",
973
+ "_view_count": null,
974
+ "_view_module": "@jupyter-widgets/base",
975
+ "_view_module_version": "1.2.0",
976
+ "_view_name": "StyleView",
977
+ "description_width": ""
978
+ }
979
+ },
980
+ "f403a8090a6646a5b24bd3f1a482a466": {
981
+ "model_module": "@jupyter-widgets/controls",
982
+ "model_name": "HBoxModel",
983
+ "model_module_version": "1.5.0",
984
+ "state": {
985
+ "_dom_classes": [],
986
+ "_model_module": "@jupyter-widgets/controls",
987
+ "_model_module_version": "1.5.0",
988
+ "_model_name": "HBoxModel",
989
+ "_view_count": null,
990
+ "_view_module": "@jupyter-widgets/controls",
991
+ "_view_module_version": "1.5.0",
992
+ "_view_name": "HBoxView",
993
+ "box_style": "",
994
+ "children": [
995
+ "IPY_MODEL_7c5e45acf4f44fbbbe42ba6ae0d1a00b",
996
+ "IPY_MODEL_241d22a572d14deeb99cf23d32b15437",
997
+ "IPY_MODEL_833282adf0374866a2e923ba2d89ed54"
998
+ ],
999
+ "layout": "IPY_MODEL_92893ea5925a416496dbb5f0f6cc5fe4"
1000
+ }
1001
+ },
1002
+ "7c5e45acf4f44fbbbe42ba6ae0d1a00b": {
1003
+ "model_module": "@jupyter-widgets/controls",
1004
+ "model_name": "HTMLModel",
1005
+ "model_module_version": "1.5.0",
1006
+ "state": {
1007
+ "_dom_classes": [],
1008
+ "_model_module": "@jupyter-widgets/controls",
1009
+ "_model_module_version": "1.5.0",
1010
+ "_model_name": "HTMLModel",
1011
+ "_view_count": null,
1012
+ "_view_module": "@jupyter-widgets/controls",
1013
+ "_view_module_version": "1.5.0",
1014
+ "_view_name": "HTMLView",
1015
+ "description": "",
1016
+ "description_tooltip": null,
1017
+ "layout": "IPY_MODEL_b965c7efbf2c4bb59f6d6339bca638aa",
1018
+ "placeholder": "​",
1019
+ "style": "IPY_MODEL_8543bc719912446a956bc1df364892dc",
1020
+ "value": "model.safetensors: 100%"
1021
+ }
1022
+ },
1023
+ "241d22a572d14deeb99cf23d32b15437": {
1024
+ "model_module": "@jupyter-widgets/controls",
1025
+ "model_name": "FloatProgressModel",
1026
+ "model_module_version": "1.5.0",
1027
+ "state": {
1028
+ "_dom_classes": [],
1029
+ "_model_module": "@jupyter-widgets/controls",
1030
+ "_model_module_version": "1.5.0",
1031
+ "_model_name": "FloatProgressModel",
1032
+ "_view_count": null,
1033
+ "_view_module": "@jupyter-widgets/controls",
1034
+ "_view_module_version": "1.5.0",
1035
+ "_view_name": "ProgressView",
1036
+ "bar_style": "success",
1037
+ "description": "",
1038
+ "description_tooltip": null,
1039
+ "layout": "IPY_MODEL_7df787a07b5442cf9995c0e239c65c25",
1040
+ "max": 497774208,
1041
+ "min": 0,
1042
+ "orientation": "horizontal",
1043
+ "style": "IPY_MODEL_1b93b372a091455b90d7aee81706868d",
1044
+ "value": 497774208
1045
+ }
1046
+ },
1047
+ "833282adf0374866a2e923ba2d89ed54": {
1048
+ "model_module": "@jupyter-widgets/controls",
1049
+ "model_name": "HTMLModel",
1050
+ "model_module_version": "1.5.0",
1051
+ "state": {
1052
+ "_dom_classes": [],
1053
+ "_model_module": "@jupyter-widgets/controls",
1054
+ "_model_module_version": "1.5.0",
1055
+ "_model_name": "HTMLModel",
1056
+ "_view_count": null,
1057
+ "_view_module": "@jupyter-widgets/controls",
1058
+ "_view_module_version": "1.5.0",
1059
+ "_view_name": "HTMLView",
1060
+ "description": "",
1061
+ "description_tooltip": null,
1062
+ "layout": "IPY_MODEL_dccf8ecf30d94f3ca449bf2f681683c7",
1063
+ "placeholder": "​",
1064
+ "style": "IPY_MODEL_0ffd8ed4d4e84c2eae4837978e6dfdcf",
1065
+ "value": " 498M/498M [00:27&lt;00:00, 30.2MB/s]"
1066
+ }
1067
+ },
1068
+ "92893ea5925a416496dbb5f0f6cc5fe4": {
1069
+ "model_module": "@jupyter-widgets/base",
1070
+ "model_name": "LayoutModel",
1071
+ "model_module_version": "1.2.0",
1072
+ "state": {
1073
+ "_model_module": "@jupyter-widgets/base",
1074
+ "_model_module_version": "1.2.0",
1075
+ "_model_name": "LayoutModel",
1076
+ "_view_count": null,
1077
+ "_view_module": "@jupyter-widgets/base",
1078
+ "_view_module_version": "1.2.0",
1079
+ "_view_name": "LayoutView",
1080
+ "align_content": null,
1081
+ "align_items": null,
1082
+ "align_self": null,
1083
+ "border": null,
1084
+ "bottom": null,
1085
+ "display": null,
1086
+ "flex": null,
1087
+ "flex_flow": null,
1088
+ "grid_area": null,
1089
+ "grid_auto_columns": null,
1090
+ "grid_auto_flow": null,
1091
+ "grid_auto_rows": null,
1092
+ "grid_column": null,
1093
+ "grid_gap": null,
1094
+ "grid_row": null,
1095
+ "grid_template_areas": null,
1096
+ "grid_template_columns": null,
1097
+ "grid_template_rows": null,
1098
+ "height": null,
1099
+ "justify_content": null,
1100
+ "justify_items": null,
1101
+ "left": null,
1102
+ "margin": null,
1103
+ "max_height": null,
1104
+ "max_width": null,
1105
+ "min_height": null,
1106
+ "min_width": null,
1107
+ "object_fit": null,
1108
+ "object_position": null,
1109
+ "order": null,
1110
+ "overflow": null,
1111
+ "overflow_x": null,
1112
+ "overflow_y": null,
1113
+ "padding": null,
1114
+ "right": null,
1115
+ "top": null,
1116
+ "visibility": null,
1117
+ "width": null
1118
+ }
1119
+ },
1120
+ "b965c7efbf2c4bb59f6d6339bca638aa": {
1121
+ "model_module": "@jupyter-widgets/base",
1122
+ "model_name": "LayoutModel",
1123
+ "model_module_version": "1.2.0",
1124
+ "state": {
1125
+ "_model_module": "@jupyter-widgets/base",
1126
+ "_model_module_version": "1.2.0",
1127
+ "_model_name": "LayoutModel",
1128
+ "_view_count": null,
1129
+ "_view_module": "@jupyter-widgets/base",
1130
+ "_view_module_version": "1.2.0",
1131
+ "_view_name": "LayoutView",
1132
+ "align_content": null,
1133
+ "align_items": null,
1134
+ "align_self": null,
1135
+ "border": null,
1136
+ "bottom": null,
1137
+ "display": null,
1138
+ "flex": null,
1139
+ "flex_flow": null,
1140
+ "grid_area": null,
1141
+ "grid_auto_columns": null,
1142
+ "grid_auto_flow": null,
1143
+ "grid_auto_rows": null,
1144
+ "grid_column": null,
1145
+ "grid_gap": null,
1146
+ "grid_row": null,
1147
+ "grid_template_areas": null,
1148
+ "grid_template_columns": null,
1149
+ "grid_template_rows": null,
1150
+ "height": null,
1151
+ "justify_content": null,
1152
+ "justify_items": null,
1153
+ "left": null,
1154
+ "margin": null,
1155
+ "max_height": null,
1156
+ "max_width": null,
1157
+ "min_height": null,
1158
+ "min_width": null,
1159
+ "object_fit": null,
1160
+ "object_position": null,
1161
+ "order": null,
1162
+ "overflow": null,
1163
+ "overflow_x": null,
1164
+ "overflow_y": null,
1165
+ "padding": null,
1166
+ "right": null,
1167
+ "top": null,
1168
+ "visibility": null,
1169
+ "width": null
1170
+ }
1171
+ },
1172
+ "8543bc719912446a956bc1df364892dc": {
1173
+ "model_module": "@jupyter-widgets/controls",
1174
+ "model_name": "DescriptionStyleModel",
1175
+ "model_module_version": "1.5.0",
1176
+ "state": {
1177
+ "_model_module": "@jupyter-widgets/controls",
1178
+ "_model_module_version": "1.5.0",
1179
+ "_model_name": "DescriptionStyleModel",
1180
+ "_view_count": null,
1181
+ "_view_module": "@jupyter-widgets/base",
1182
+ "_view_module_version": "1.2.0",
1183
+ "_view_name": "StyleView",
1184
+ "description_width": ""
1185
+ }
1186
+ },
1187
+ "7df787a07b5442cf9995c0e239c65c25": {
1188
+ "model_module": "@jupyter-widgets/base",
1189
+ "model_name": "LayoutModel",
1190
+ "model_module_version": "1.2.0",
1191
+ "state": {
1192
+ "_model_module": "@jupyter-widgets/base",
1193
+ "_model_module_version": "1.2.0",
1194
+ "_model_name": "LayoutModel",
1195
+ "_view_count": null,
1196
+ "_view_module": "@jupyter-widgets/base",
1197
+ "_view_module_version": "1.2.0",
1198
+ "_view_name": "LayoutView",
1199
+ "align_content": null,
1200
+ "align_items": null,
1201
+ "align_self": null,
1202
+ "border": null,
1203
+ "bottom": null,
1204
+ "display": null,
1205
+ "flex": null,
1206
+ "flex_flow": null,
1207
+ "grid_area": null,
1208
+ "grid_auto_columns": null,
1209
+ "grid_auto_flow": null,
1210
+ "grid_auto_rows": null,
1211
+ "grid_column": null,
1212
+ "grid_gap": null,
1213
+ "grid_row": null,
1214
+ "grid_template_areas": null,
1215
+ "grid_template_columns": null,
1216
+ "grid_template_rows": null,
1217
+ "height": null,
1218
+ "justify_content": null,
1219
+ "justify_items": null,
1220
+ "left": null,
1221
+ "margin": null,
1222
+ "max_height": null,
1223
+ "max_width": null,
1224
+ "min_height": null,
1225
+ "min_width": null,
1226
+ "object_fit": null,
1227
+ "object_position": null,
1228
+ "order": null,
1229
+ "overflow": null,
1230
+ "overflow_x": null,
1231
+ "overflow_y": null,
1232
+ "padding": null,
1233
+ "right": null,
1234
+ "top": null,
1235
+ "visibility": null,
1236
+ "width": null
1237
+ }
1238
+ },
1239
+ "1b93b372a091455b90d7aee81706868d": {
1240
+ "model_module": "@jupyter-widgets/controls",
1241
+ "model_name": "ProgressStyleModel",
1242
+ "model_module_version": "1.5.0",
1243
+ "state": {
1244
+ "_model_module": "@jupyter-widgets/controls",
1245
+ "_model_module_version": "1.5.0",
1246
+ "_model_name": "ProgressStyleModel",
1247
+ "_view_count": null,
1248
+ "_view_module": "@jupyter-widgets/base",
1249
+ "_view_module_version": "1.2.0",
1250
+ "_view_name": "StyleView",
1251
+ "bar_color": null,
1252
+ "description_width": ""
1253
+ }
1254
+ },
1255
+ "dccf8ecf30d94f3ca449bf2f681683c7": {
1256
+ "model_module": "@jupyter-widgets/base",
1257
+ "model_name": "LayoutModel",
1258
+ "model_module_version": "1.2.0",
1259
+ "state": {
1260
+ "_model_module": "@jupyter-widgets/base",
1261
+ "_model_module_version": "1.2.0",
1262
+ "_model_name": "LayoutModel",
1263
+ "_view_count": null,
1264
+ "_view_module": "@jupyter-widgets/base",
1265
+ "_view_module_version": "1.2.0",
1266
+ "_view_name": "LayoutView",
1267
+ "align_content": null,
1268
+ "align_items": null,
1269
+ "align_self": null,
1270
+ "border": null,
1271
+ "bottom": null,
1272
+ "display": null,
1273
+ "flex": null,
1274
+ "flex_flow": null,
1275
+ "grid_area": null,
1276
+ "grid_auto_columns": null,
1277
+ "grid_auto_flow": null,
1278
+ "grid_auto_rows": null,
1279
+ "grid_column": null,
1280
+ "grid_gap": null,
1281
+ "grid_row": null,
1282
+ "grid_template_areas": null,
1283
+ "grid_template_columns": null,
1284
+ "grid_template_rows": null,
1285
+ "height": null,
1286
+ "justify_content": null,
1287
+ "justify_items": null,
1288
+ "left": null,
1289
+ "margin": null,
1290
+ "max_height": null,
1291
+ "max_width": null,
1292
+ "min_height": null,
1293
+ "min_width": null,
1294
+ "object_fit": null,
1295
+ "object_position": null,
1296
+ "order": null,
1297
+ "overflow": null,
1298
+ "overflow_x": null,
1299
+ "overflow_y": null,
1300
+ "padding": null,
1301
+ "right": null,
1302
+ "top": null,
1303
+ "visibility": null,
1304
+ "width": null
1305
+ }
1306
+ },
1307
+ "0ffd8ed4d4e84c2eae4837978e6dfdcf": {
1308
+ "model_module": "@jupyter-widgets/controls",
1309
+ "model_name": "DescriptionStyleModel",
1310
+ "model_module_version": "1.5.0",
1311
+ "state": {
1312
+ "_model_module": "@jupyter-widgets/controls",
1313
+ "_model_module_version": "1.5.0",
1314
+ "_model_name": "DescriptionStyleModel",
1315
+ "_view_count": null,
1316
+ "_view_module": "@jupyter-widgets/base",
1317
+ "_view_module_version": "1.2.0",
1318
+ "_view_name": "StyleView",
1319
+ "description_width": ""
1320
+ }
1321
+ },
1322
+ "1a8e5de3f44b4deb9815fe7dcac10f71": {
1323
+ "model_module": "@jupyter-widgets/controls",
1324
+ "model_name": "HBoxModel",
1325
+ "model_module_version": "1.5.0",
1326
+ "state": {
1327
+ "_dom_classes": [],
1328
+ "_model_module": "@jupyter-widgets/controls",
1329
+ "_model_module_version": "1.5.0",
1330
+ "_model_name": "HBoxModel",
1331
+ "_view_count": null,
1332
+ "_view_module": "@jupyter-widgets/controls",
1333
+ "_view_module_version": "1.5.0",
1334
+ "_view_name": "HBoxView",
1335
+ "box_style": "",
1336
+ "children": [
1337
+ "IPY_MODEL_15f90e6de63647a291899befc0912db8",
1338
+ "IPY_MODEL_288e7c00f27b421388f23f1255d01f2d",
1339
+ "IPY_MODEL_f57174571a494c4cb2074a904f3b86ce"
1340
+ ],
1341
+ "layout": "IPY_MODEL_8eb37b23513e49679dd5f12554a66295"
1342
+ }
1343
+ },
1344
+ "15f90e6de63647a291899befc0912db8": {
1345
+ "model_module": "@jupyter-widgets/controls",
1346
+ "model_name": "HTMLModel",
1347
+ "model_module_version": "1.5.0",
1348
+ "state": {
1349
+ "_dom_classes": [],
1350
+ "_model_module": "@jupyter-widgets/controls",
1351
+ "_model_module_version": "1.5.0",
1352
+ "_model_name": "HTMLModel",
1353
+ "_view_count": null,
1354
+ "_view_module": "@jupyter-widgets/controls",
1355
+ "_view_module_version": "1.5.0",
1356
+ "_view_name": "HTMLView",
1357
+ "description": "",
1358
+ "description_tooltip": null,
1359
+ "layout": "IPY_MODEL_de0b0d803dde4c8fa8bcd9eda5210420",
1360
+ "placeholder": "​",
1361
+ "style": "IPY_MODEL_3be10b8fc42749fdb522f3168952b3ea",
1362
+ "value": "README.md: 100%"
1363
+ }
1364
+ },
1365
+ "288e7c00f27b421388f23f1255d01f2d": {
1366
+ "model_module": "@jupyter-widgets/controls",
1367
+ "model_name": "FloatProgressModel",
1368
+ "model_module_version": "1.5.0",
1369
+ "state": {
1370
+ "_dom_classes": [],
1371
+ "_model_module": "@jupyter-widgets/controls",
1372
+ "_model_module_version": "1.5.0",
1373
+ "_model_name": "FloatProgressModel",
1374
+ "_view_count": null,
1375
+ "_view_module": "@jupyter-widgets/controls",
1376
+ "_view_module_version": "1.5.0",
1377
+ "_view_name": "ProgressView",
1378
+ "bar_style": "success",
1379
+ "description": "",
1380
+ "description_tooltip": null,
1381
+ "layout": "IPY_MODEL_d2895d4001b24dc6bc52f8ead03f77a3",
1382
+ "max": 2190,
1383
+ "min": 0,
1384
+ "orientation": "horizontal",
1385
+ "style": "IPY_MODEL_99962b09abe44dc7977f067371cf65ef",
1386
+ "value": 2190
1387
+ }
1388
+ },
1389
+ "f57174571a494c4cb2074a904f3b86ce": {
1390
+ "model_module": "@jupyter-widgets/controls",
1391
+ "model_name": "HTMLModel",
1392
+ "model_module_version": "1.5.0",
1393
+ "state": {
1394
+ "_dom_classes": [],
1395
+ "_model_module": "@jupyter-widgets/controls",
1396
+ "_model_module_version": "1.5.0",
1397
+ "_model_name": "HTMLModel",
1398
+ "_view_count": null,
1399
+ "_view_module": "@jupyter-widgets/controls",
1400
+ "_view_module_version": "1.5.0",
1401
+ "_view_name": "HTMLView",
1402
+ "description": "",
1403
+ "description_tooltip": null,
1404
+ "layout": "IPY_MODEL_e1434108affa47fa94b2680e72319099",
1405
+ "placeholder": "​",
1406
+ "style": "IPY_MODEL_91d6a93bbb374189be6d6b8a62c8ab9b",
1407
+ "value": " 2.19k/2.19k [00:00&lt;00:00, 197kB/s]"
1408
+ }
1409
+ },
1410
+ "8eb37b23513e49679dd5f12554a66295": {
1411
+ "model_module": "@jupyter-widgets/base",
1412
+ "model_name": "LayoutModel",
1413
+ "model_module_version": "1.2.0",
1414
+ "state": {
1415
+ "_model_module": "@jupyter-widgets/base",
1416
+ "_model_module_version": "1.2.0",
1417
+ "_model_name": "LayoutModel",
1418
+ "_view_count": null,
1419
+ "_view_module": "@jupyter-widgets/base",
1420
+ "_view_module_version": "1.2.0",
1421
+ "_view_name": "LayoutView",
1422
+ "align_content": null,
1423
+ "align_items": null,
1424
+ "align_self": null,
1425
+ "border": null,
1426
+ "bottom": null,
1427
+ "display": null,
1428
+ "flex": null,
1429
+ "flex_flow": null,
1430
+ "grid_area": null,
1431
+ "grid_auto_columns": null,
1432
+ "grid_auto_flow": null,
1433
+ "grid_auto_rows": null,
1434
+ "grid_column": null,
1435
+ "grid_gap": null,
1436
+ "grid_row": null,
1437
+ "grid_template_areas": null,
1438
+ "grid_template_columns": null,
1439
+ "grid_template_rows": null,
1440
+ "height": null,
1441
+ "justify_content": null,
1442
+ "justify_items": null,
1443
+ "left": null,
1444
+ "margin": null,
1445
+ "max_height": null,
1446
+ "max_width": null,
1447
+ "min_height": null,
1448
+ "min_width": null,
1449
+ "object_fit": null,
1450
+ "object_position": null,
1451
+ "order": null,
1452
+ "overflow": null,
1453
+ "overflow_x": null,
1454
+ "overflow_y": null,
1455
+ "padding": null,
1456
+ "right": null,
1457
+ "top": null,
1458
+ "visibility": null,
1459
+ "width": null
1460
+ }
1461
+ },
1462
+ "de0b0d803dde4c8fa8bcd9eda5210420": {
1463
+ "model_module": "@jupyter-widgets/base",
1464
+ "model_name": "LayoutModel",
1465
+ "model_module_version": "1.2.0",
1466
+ "state": {
1467
+ "_model_module": "@jupyter-widgets/base",
1468
+ "_model_module_version": "1.2.0",
1469
+ "_model_name": "LayoutModel",
1470
+ "_view_count": null,
1471
+ "_view_module": "@jupyter-widgets/base",
1472
+ "_view_module_version": "1.2.0",
1473
+ "_view_name": "LayoutView",
1474
+ "align_content": null,
1475
+ "align_items": null,
1476
+ "align_self": null,
1477
+ "border": null,
1478
+ "bottom": null,
1479
+ "display": null,
1480
+ "flex": null,
1481
+ "flex_flow": null,
1482
+ "grid_area": null,
1483
+ "grid_auto_columns": null,
1484
+ "grid_auto_flow": null,
1485
+ "grid_auto_rows": null,
1486
+ "grid_column": null,
1487
+ "grid_gap": null,
1488
+ "grid_row": null,
1489
+ "grid_template_areas": null,
1490
+ "grid_template_columns": null,
1491
+ "grid_template_rows": null,
1492
+ "height": null,
1493
+ "justify_content": null,
1494
+ "justify_items": null,
1495
+ "left": null,
1496
+ "margin": null,
1497
+ "max_height": null,
1498
+ "max_width": null,
1499
+ "min_height": null,
1500
+ "min_width": null,
1501
+ "object_fit": null,
1502
+ "object_position": null,
1503
+ "order": null,
1504
+ "overflow": null,
1505
+ "overflow_x": null,
1506
+ "overflow_y": null,
1507
+ "padding": null,
1508
+ "right": null,
1509
+ "top": null,
1510
+ "visibility": null,
1511
+ "width": null
1512
+ }
1513
+ },
1514
+ "3be10b8fc42749fdb522f3168952b3ea": {
1515
+ "model_module": "@jupyter-widgets/controls",
1516
+ "model_name": "DescriptionStyleModel",
1517
+ "model_module_version": "1.5.0",
1518
+ "state": {
1519
+ "_model_module": "@jupyter-widgets/controls",
1520
+ "_model_module_version": "1.5.0",
1521
+ "_model_name": "DescriptionStyleModel",
1522
+ "_view_count": null,
1523
+ "_view_module": "@jupyter-widgets/base",
1524
+ "_view_module_version": "1.2.0",
1525
+ "_view_name": "StyleView",
1526
+ "description_width": ""
1527
+ }
1528
+ },
1529
+ "d2895d4001b24dc6bc52f8ead03f77a3": {
1530
+ "model_module": "@jupyter-widgets/base",
1531
+ "model_name": "LayoutModel",
1532
+ "model_module_version": "1.2.0",
1533
+ "state": {
1534
+ "_model_module": "@jupyter-widgets/base",
1535
+ "_model_module_version": "1.2.0",
1536
+ "_model_name": "LayoutModel",
1537
+ "_view_count": null,
1538
+ "_view_module": "@jupyter-widgets/base",
1539
+ "_view_module_version": "1.2.0",
1540
+ "_view_name": "LayoutView",
1541
+ "align_content": null,
1542
+ "align_items": null,
1543
+ "align_self": null,
1544
+ "border": null,
1545
+ "bottom": null,
1546
+ "display": null,
1547
+ "flex": null,
1548
+ "flex_flow": null,
1549
+ "grid_area": null,
1550
+ "grid_auto_columns": null,
1551
+ "grid_auto_flow": null,
1552
+ "grid_auto_rows": null,
1553
+ "grid_column": null,
1554
+ "grid_gap": null,
1555
+ "grid_row": null,
1556
+ "grid_template_areas": null,
1557
+ "grid_template_columns": null,
1558
+ "grid_template_rows": null,
1559
+ "height": null,
1560
+ "justify_content": null,
1561
+ "justify_items": null,
1562
+ "left": null,
1563
+ "margin": null,
1564
+ "max_height": null,
1565
+ "max_width": null,
1566
+ "min_height": null,
1567
+ "min_width": null,
1568
+ "object_fit": null,
1569
+ "object_position": null,
1570
+ "order": null,
1571
+ "overflow": null,
1572
+ "overflow_x": null,
1573
+ "overflow_y": null,
1574
+ "padding": null,
1575
+ "right": null,
1576
+ "top": null,
1577
+ "visibility": null,
1578
+ "width": null
1579
+ }
1580
+ },
1581
+ "99962b09abe44dc7977f067371cf65ef": {
1582
+ "model_module": "@jupyter-widgets/controls",
1583
+ "model_name": "ProgressStyleModel",
1584
+ "model_module_version": "1.5.0",
1585
+ "state": {
1586
+ "_model_module": "@jupyter-widgets/controls",
1587
+ "_model_module_version": "1.5.0",
1588
+ "_model_name": "ProgressStyleModel",
1589
+ "_view_count": null,
1590
+ "_view_module": "@jupyter-widgets/base",
1591
+ "_view_module_version": "1.2.0",
1592
+ "_view_name": "StyleView",
1593
+ "bar_color": null,
1594
+ "description_width": ""
1595
+ }
1596
+ },
1597
+ "e1434108affa47fa94b2680e72319099": {
1598
+ "model_module": "@jupyter-widgets/base",
1599
+ "model_name": "LayoutModel",
1600
+ "model_module_version": "1.2.0",
1601
+ "state": {
1602
+ "_model_module": "@jupyter-widgets/base",
1603
+ "_model_module_version": "1.2.0",
1604
+ "_model_name": "LayoutModel",
1605
+ "_view_count": null,
1606
+ "_view_module": "@jupyter-widgets/base",
1607
+ "_view_module_version": "1.2.0",
1608
+ "_view_name": "LayoutView",
1609
+ "align_content": null,
1610
+ "align_items": null,
1611
+ "align_self": null,
1612
+ "border": null,
1613
+ "bottom": null,
1614
+ "display": null,
1615
+ "flex": null,
1616
+ "flex_flow": null,
1617
+ "grid_area": null,
1618
+ "grid_auto_columns": null,
1619
+ "grid_auto_flow": null,
1620
+ "grid_auto_rows": null,
1621
+ "grid_column": null,
1622
+ "grid_gap": null,
1623
+ "grid_row": null,
1624
+ "grid_template_areas": null,
1625
+ "grid_template_columns": null,
1626
+ "grid_template_rows": null,
1627
+ "height": null,
1628
+ "justify_content": null,
1629
+ "justify_items": null,
1630
+ "left": null,
1631
+ "margin": null,
1632
+ "max_height": null,
1633
+ "max_width": null,
1634
+ "min_height": null,
1635
+ "min_width": null,
1636
+ "object_fit": null,
1637
+ "object_position": null,
1638
+ "order": null,
1639
+ "overflow": null,
1640
+ "overflow_x": null,
1641
+ "overflow_y": null,
1642
+ "padding": null,
1643
+ "right": null,
1644
+ "top": null,
1645
+ "visibility": null,
1646
+ "width": null
1647
+ }
1648
+ },
1649
+ "91d6a93bbb374189be6d6b8a62c8ab9b": {
1650
+ "model_module": "@jupyter-widgets/controls",
1651
+ "model_name": "DescriptionStyleModel",
1652
+ "model_module_version": "1.5.0",
1653
+ "state": {
1654
+ "_model_module": "@jupyter-widgets/controls",
1655
+ "_model_module_version": "1.5.0",
1656
+ "_model_name": "DescriptionStyleModel",
1657
+ "_view_count": null,
1658
+ "_view_module": "@jupyter-widgets/base",
1659
+ "_view_module_version": "1.2.0",
1660
+ "_view_name": "StyleView",
1661
+ "description_width": ""
1662
+ }
1663
+ }
1664
+ }
1665
+ }
1666
+ },
1667
+ "cells": [
1668
+ {
1669
+ "cell_type": "markdown",
1670
+ "source": [
1671
+ "# Installing Dependencies"
1672
+ ],
1673
+ "metadata": {
1674
+ "id": "_F3_7tgFKPn5"
1675
+ }
1676
+ },
1677
+ {
1678
+ "cell_type": "code",
1679
+ "source": [
1680
+ "!pip install transformers datasets torch accelerate huggingface_hub"
1681
+ ],
1682
+ "metadata": {
1683
+ "colab": {
1684
+ "base_uri": "https://localhost:8080/"
1685
+ },
1686
+ "id": "8k3qYvLn8zE0",
1687
+ "outputId": "0c3e5c62-b3f1-43f9-cbc8-509011f68fa9"
1688
+ },
1689
+ "execution_count": 1,
1690
+ "outputs": [
1691
+ {
1692
+ "output_type": "stream",
1693
+ "name": "stdout",
1694
+ "text": [
1695
+ "Requirement already satisfied: transformers in /usr/local/lib/python3.10/dist-packages (4.40.1)\n",
1696
+ "Collecting datasets\n",
1697
+ " Downloading datasets-2.19.1-py3-none-any.whl (542 kB)\n",
1698
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m542.0/542.0 kB\u001b[0m \u001b[31m9.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
1699
+ "\u001b[?25hRequirement already satisfied: torch in /usr/local/lib/python3.10/dist-packages (2.2.1+cu121)\n",
1700
+ "Collecting accelerate\n",
1701
+ " Downloading accelerate-0.30.0-py3-none-any.whl (302 kB)\n",
1702
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m302.4/302.4 kB\u001b[0m \u001b[31m33.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
1703
+ "\u001b[?25hRequirement already satisfied: huggingface_hub in /usr/local/lib/python3.10/dist-packages (0.20.3)\n",
1704
+ "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers) (3.14.0)\n",
1705
+ "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (1.25.2)\n",
1706
+ "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers) (24.0)\n",
1707
+ "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (6.0.1)\n",
1708
+ "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (2023.12.25)\n",
1709
+ "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers) (2.31.0)\n",
1710
+ "Requirement already satisfied: tokenizers<0.20,>=0.19 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.19.1)\n",
1711
+ "Requirement already satisfied: safetensors>=0.4.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.4.3)\n",
1712
+ "Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers) (4.66.4)\n",
1713
+ "Requirement already satisfied: pyarrow>=12.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (14.0.2)\n",
1714
+ "Requirement already satisfied: pyarrow-hotfix in /usr/local/lib/python3.10/dist-packages (from datasets) (0.6)\n",
1715
+ "Collecting dill<0.3.9,>=0.3.0 (from datasets)\n",
1716
+ " Downloading dill-0.3.8-py3-none-any.whl (116 kB)\n",
1717
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m116.3/116.3 kB\u001b[0m \u001b[31m12.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
1718
+ "\u001b[?25hRequirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from datasets) (2.0.3)\n",
1719
+ "Collecting xxhash (from datasets)\n",
1720
+ " Downloading xxhash-3.4.1-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (194 kB)\n",
1721
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m194.1/194.1 kB\u001b[0m \u001b[31m11.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
1722
+ "\u001b[?25hCollecting multiprocess (from datasets)\n",
1723
+ " Downloading multiprocess-0.70.16-py310-none-any.whl (134 kB)\n",
1724
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.8/134.8 kB\u001b[0m \u001b[31m15.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
1725
+ "\u001b[?25hRequirement already satisfied: fsspec[http]<=2024.3.1,>=2023.1.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (2023.6.0)\n",
1726
+ "Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets) (3.9.5)\n",
1727
+ "Collecting huggingface_hub\n",
1728
+ " Downloading huggingface_hub-0.23.0-py3-none-any.whl (401 kB)\n",
1729
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m401.2/401.2 kB\u001b[0m \u001b[31m36.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
1730
+ "\u001b[?25hRequirement already satisfied: typing-extensions>=4.8.0 in /usr/local/lib/python3.10/dist-packages (from torch) (4.11.0)\n",
1731
+ "Requirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch) (1.12)\n",
1732
+ "Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch) (3.3)\n",
1733
+ "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from torch) (3.1.3)\n",
1734
+ "Collecting nvidia-cuda-nvrtc-cu12==12.1.105 (from torch)\n",
1735
+ " Using cached nvidia_cuda_nvrtc_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (23.7 MB)\n",
1736
+ "Collecting nvidia-cuda-runtime-cu12==12.1.105 (from torch)\n",
1737
+ " Using cached nvidia_cuda_runtime_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (823 kB)\n",
1738
+ "Collecting nvidia-cuda-cupti-cu12==12.1.105 (from torch)\n",
1739
+ " Using cached nvidia_cuda_cupti_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (14.1 MB)\n",
1740
+ "Collecting nvidia-cudnn-cu12==8.9.2.26 (from torch)\n",
1741
+ " Using cached nvidia_cudnn_cu12-8.9.2.26-py3-none-manylinux1_x86_64.whl (731.7 MB)\n",
1742
+ "Collecting nvidia-cublas-cu12==12.1.3.1 (from torch)\n",
1743
+ " Using cached nvidia_cublas_cu12-12.1.3.1-py3-none-manylinux1_x86_64.whl (410.6 MB)\n",
1744
+ "Collecting nvidia-cufft-cu12==11.0.2.54 (from torch)\n",
1745
+ " Using cached nvidia_cufft_cu12-11.0.2.54-py3-none-manylinux1_x86_64.whl (121.6 MB)\n",
1746
+ "Collecting nvidia-curand-cu12==10.3.2.106 (from torch)\n",
1747
+ " Using cached nvidia_curand_cu12-10.3.2.106-py3-none-manylinux1_x86_64.whl (56.5 MB)\n",
1748
+ "Collecting nvidia-cusolver-cu12==11.4.5.107 (from torch)\n",
1749
+ " Using cached nvidia_cusolver_cu12-11.4.5.107-py3-none-manylinux1_x86_64.whl (124.2 MB)\n",
1750
+ "Collecting nvidia-cusparse-cu12==12.1.0.106 (from torch)\n",
1751
+ " Using cached nvidia_cusparse_cu12-12.1.0.106-py3-none-manylinux1_x86_64.whl (196.0 MB)\n",
1752
+ "Collecting nvidia-nccl-cu12==2.19.3 (from torch)\n",
1753
+ " Using cached nvidia_nccl_cu12-2.19.3-py3-none-manylinux1_x86_64.whl (166.0 MB)\n",
1754
+ "Collecting nvidia-nvtx-cu12==12.1.105 (from torch)\n",
1755
+ " Using cached nvidia_nvtx_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (99 kB)\n",
1756
+ "Requirement already satisfied: triton==2.2.0 in /usr/local/lib/python3.10/dist-packages (from torch) (2.2.0)\n",
1757
+ "Collecting nvidia-nvjitlink-cu12 (from nvidia-cusolver-cu12==11.4.5.107->torch)\n",
1758
+ " Using cached nvidia_nvjitlink_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl (21.1 MB)\n",
1759
+ "Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate) (5.9.5)\n",
1760
+ "Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.3.1)\n",
1761
+ "Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (23.2.0)\n",
1762
+ "Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.4.1)\n",
1763
+ "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (6.0.5)\n",
1764
+ "Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.9.4)\n",
1765
+ "Requirement already satisfied: async-timeout<5.0,>=4.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (4.0.3)\n",
1766
+ "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.3.2)\n",
1767
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.7)\n",
1768
+ "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2.0.7)\n",
1769
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2024.2.2)\n",
1770
+ "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch) (2.1.5)\n",
1771
+ "Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2.8.2)\n",
1772
+ "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2023.4)\n",
1773
+ "Requirement already satisfied: tzdata>=2022.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2024.1)\n",
1774
+ "Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch) (1.3.0)\n",
1775
+ "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.2->pandas->datasets) (1.16.0)\n",
1776
+ "Installing collected packages: xxhash, nvidia-nvtx-cu12, nvidia-nvjitlink-cu12, nvidia-nccl-cu12, nvidia-curand-cu12, nvidia-cufft-cu12, nvidia-cuda-runtime-cu12, nvidia-cuda-nvrtc-cu12, nvidia-cuda-cupti-cu12, nvidia-cublas-cu12, dill, nvidia-cusparse-cu12, nvidia-cudnn-cu12, multiprocess, huggingface_hub, nvidia-cusolver-cu12, datasets, accelerate\n",
1777
+ " Attempting uninstall: huggingface_hub\n",
1778
+ " Found existing installation: huggingface-hub 0.20.3\n",
1779
+ " Uninstalling huggingface-hub-0.20.3:\n",
1780
+ " Successfully uninstalled huggingface-hub-0.20.3\n",
1781
+ "Successfully installed accelerate-0.30.0 datasets-2.19.1 dill-0.3.8 huggingface_hub-0.23.0 multiprocess-0.70.16 nvidia-cublas-cu12-12.1.3.1 nvidia-cuda-cupti-cu12-12.1.105 nvidia-cuda-nvrtc-cu12-12.1.105 nvidia-cuda-runtime-cu12-12.1.105 nvidia-cudnn-cu12-8.9.2.26 nvidia-cufft-cu12-11.0.2.54 nvidia-curand-cu12-10.3.2.106 nvidia-cusolver-cu12-11.4.5.107 nvidia-cusparse-cu12-12.1.0.106 nvidia-nccl-cu12-2.19.3 nvidia-nvjitlink-cu12-12.4.127 nvidia-nvtx-cu12-12.1.105 xxhash-3.4.1\n"
1782
+ ]
1783
+ }
1784
+ ]
1785
+ },
1786
+ {
1787
+ "cell_type": "code",
1788
+ "source": [
1789
+ "from huggingface_hub import notebook_login\n",
1790
+ "notebook_login()"
1791
+ ],
1792
+ "metadata": {
1793
+ "colab": {
1794
+ "base_uri": "https://localhost:8080/",
1795
+ "height": 145,
1796
+ "referenced_widgets": [
1797
+ "a268227e95cc46cda6c40f88f76729b4",
1798
+ "5d2b151866db434b9a97054136972c02",
1799
+ "26e2d737d2334bfaab84d7567957f98f",
1800
+ "f65f24dbbc8e43ddb98f786c70412088",
1801
+ "92abf62190e543a8bcf5cd497fb0594e",
1802
+ "3d9f52d2c3294ca4a83d91987387ff8c",
1803
+ "c3b6d6efc0bb4cebb43e54f1cac15398",
1804
+ "dfb07bd69a98467385a922d93dbbdf78",
1805
+ "b8c97b05b8cd41929982d3dfa4c0253e",
1806
+ "c14e7006466f465495524c631cb47296",
1807
+ "49eef402a9aa41c09b515ccd03b1ded4",
1808
+ "3af71b9541134fe9a62c1c3fe594062b",
1809
+ "aebc8baf9fc442bb86a849886c94eebd",
1810
+ "16c2e8011f0f45808960ab2b8bd53443",
1811
+ "7bb44167e92e4d73ac5ea1ced3d08110",
1812
+ "ebefb66192ce436cb6bdc2f6e889479c",
1813
+ "ce227eacf424429899de05839c6a09b4",
1814
+ "f453dda624134aaeb5aaa68280b16a14",
1815
+ "08187be630cf4f3c914cabcc2aec20dd",
1816
+ "06ca0c50c53c4d4da485ff88bf94299b",
1817
+ "8d2fc30851ab4972a0fc9763f81ed088",
1818
+ "6c9471e6455a4245a9fa731ef480041d",
1819
+ "e04732f9aee643378919f97ceed29a79",
1820
+ "865a67dd6e0c4b779a6bb41a8bd06882",
1821
+ "143ec709013d414d833cbd3ed2a0f74f",
1822
+ "f4d5c9d24b5a493ea78664e94ea25515",
1823
+ "afb3c41f45414f52baa9f9a9f7c7736b",
1824
+ "7fe879a2a8f44482871464fb054c1afb",
1825
+ "4d240fcf5631432fb0ee8341f71856ac",
1826
+ "94433bd4dd0c4eb0bc111e6528581bea",
1827
+ "c39370639cdd41d18156303bc54f21f7",
1828
+ "eee463d63f2d4c489f09a501ce5c387e"
1829
+ ]
1830
+ },
1831
+ "id": "i-M4tyTeKyU0",
1832
+ "outputId": "b6978682-9db0-4d19-cc99-ab6619e0972b"
1833
+ },
1834
+ "execution_count": 2,
1835
+ "outputs": [
1836
+ {
1837
+ "output_type": "display_data",
1838
+ "data": {
1839
+ "text/plain": [
1840
+ "VBox(children=(HTML(value='<center> <img\\nsrc=https://huggingface.co/front/assets/huggingface_logo-noborder.sv…"
1841
+ ],
1842
+ "application/vnd.jupyter.widget-view+json": {
1843
+ "version_major": 2,
1844
+ "version_minor": 0,
1845
+ "model_id": "a268227e95cc46cda6c40f88f76729b4"
1846
+ }
1847
+ },
1848
+ "metadata": {}
1849
+ }
1850
+ ]
1851
+ },
1852
+ {
1853
+ "cell_type": "markdown",
1854
+ "source": [
1855
+ "# Import Libraries"
1856
+ ],
1857
+ "metadata": {
1858
+ "id": "6qh-rhOOKd8U"
1859
+ }
1860
+ },
1861
+ {
1862
+ "cell_type": "code",
1863
+ "execution_count": 3,
1864
+ "metadata": {
1865
+ "id": "4OGeB2FM8fg5"
1866
+ },
1867
+ "outputs": [],
1868
+ "source": [
1869
+ "import torch\n",
1870
+ "from transformers import GPT2LMHeadModel, GPT2Tokenizer\n",
1871
+ "from transformers import TrainingArguments, Trainer\n",
1872
+ "from datasets import load_dataset, load_metric"
1873
+ ]
1874
+ },
1875
+ {
1876
+ "cell_type": "markdown",
1877
+ "source": [
1878
+ "# Load Model and Tokenizer"
1879
+ ],
1880
+ "metadata": {
1881
+ "id": "MVbtM0vwKuOA"
1882
+ }
1883
+ },
1884
+ {
1885
+ "cell_type": "code",
1886
+ "source": [
1887
+ "model_name = \"gpt2\"\n",
1888
+ "model = GPT2LMHeadModel.from_pretrained(model_name)\n",
1889
+ "tokenizer = GPT2Tokenizer.from_pretrained(model_name)\n",
1890
+ "tokenizer.save_pretrained(\"./gpt2-evy\")"
1891
+ ],
1892
+ "metadata": {
1893
+ "id": "TouK-jYv_WQR",
1894
+ "colab": {
1895
+ "base_uri": "https://localhost:8080/"
1896
+ },
1897
+ "outputId": "4cab9491-e796-487c-f5bb-86535019242f"
1898
+ },
1899
+ "execution_count": 34,
1900
+ "outputs": [
1901
+ {
1902
+ "output_type": "stream",
1903
+ "name": "stderr",
1904
+ "text": [
1905
+ "/usr/local/lib/python3.10/dist-packages/huggingface_hub/file_download.py:1132: FutureWarning: `resume_download` is deprecated and will be removed in version 1.0.0. Downloads always resume when possible. If you want to force a new download, use `force_download=True`.\n",
1906
+ " warnings.warn(\n"
1907
+ ]
1908
+ },
1909
+ {
1910
+ "output_type": "execute_result",
1911
+ "data": {
1912
+ "text/plain": [
1913
+ "('./gpt2-evy/tokenizer_config.json',\n",
1914
+ " './gpt2-evy/special_tokens_map.json',\n",
1915
+ " './gpt2-evy/vocab.json',\n",
1916
+ " './gpt2-evy/merges.txt',\n",
1917
+ " './gpt2-evy/added_tokens.json')"
1918
+ ]
1919
+ },
1920
+ "metadata": {},
1921
+ "execution_count": 34
1922
+ }
1923
+ ]
1924
+ },
1925
+ {
1926
+ "cell_type": "code",
1927
+ "source": [
1928
+ "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
1929
+ "\n",
1930
+ "tokenizer.pad_token = tokenizer.eos_token\n",
1931
+ "\n",
1932
+ "dataset = load_dataset(\"joshcarp/evy-dataset\")\n",
1933
+ "\n",
1934
+ "train_data = dataset[\"train\"].select([i for i in range(len(dataset[\"train\"])) if i % 10 != 0]) # Use 90% of the data for training\n",
1935
+ "val_data = dataset[\"train\"].select([i for i in range(len(dataset[\"train\"])) if i % 10 == 0]) # Use 10% of the data for validation\n",
1936
+ "\n",
1937
+ "def tokenize_function(examples):  # batched map fn: tokenizes examples['contents'] into fixed-length (512) causal-LM inputs\n",
1938
+ " inputs = tokenizer(examples['contents'], return_tensors='pt', padding='max_length', max_length=512, truncation=True)\n",
1939
+ " return {'input_ids': inputs['input_ids'], 'attention_mask': inputs['attention_mask'], 'labels': inputs['input_ids'].masked_fill(inputs['attention_mask'] == 0, -100)}  # -100 labels are ignored by the LM loss, so padding (pad == eos here) is neither attended to nor trained on\n",
1940
+ "\n",
1941
+ "train_data = train_data.map(tokenize_function, batched=True)\n",
1942
+ "val_data = val_data.map(tokenize_function, batched=True)"
1943
+ ],
1944
+ "metadata": {
1945
+ "id": "XaiAM37R_eu1"
1946
+ },
1947
+ "execution_count": 35,
1948
+ "outputs": []
1949
+ },
1950
+ {
1951
+ "cell_type": "code",
1952
+ "source": [
1953
+ "device"
1954
+ ],
1955
+ "metadata": {
1956
+ "colab": {
1957
+ "base_uri": "https://localhost:8080/"
1958
+ },
1959
+ "id": "0vW3LItNCQJY",
1960
+ "outputId": "1f9663d6-1dc4-46aa-b53b-1e7126b7f86e"
1961
+ },
1962
+ "execution_count": 17,
1963
+ "outputs": [
1964
+ {
1965
+ "output_type": "execute_result",
1966
+ "data": {
1967
+ "text/plain": [
1968
+ "device(type='cuda')"
1969
+ ]
1970
+ },
1971
+ "metadata": {},
1972
+ "execution_count": 17
1973
+ }
1974
+ ]
1975
+ },
1976
+ {
1977
+ "cell_type": "markdown",
1978
+ "source": [
1979
+ "# Train Model"
1980
+ ],
1981
+ "metadata": {
1982
+ "id": "uBKGyEdoKwWT"
1983
+ }
1984
+ },
1985
+ {
1986
+ "cell_type": "code",
1987
+ "source": [
1988
+ "# Define training arguments\n",
1989
+ "training_args = TrainingArguments(\n",
1990
+ " output_dir='./gpt2-evy',\n",
1991
+ " overwrite_output_dir=True,\n",
1992
+ " num_train_epochs=20,\n",
1993
+ " per_device_train_batch_size=8,\n",
1994
+ " evaluation_strategy=\"epoch\",\n",
1995
+ " eval_steps=1000,\n",
1996
+ " save_steps=1000,\n",
1997
+ " logging_steps=100,\n",
1998
+ " logging_dir='./logs',\n",
1999
+ " push_to_hub=True,\n",
2000
+ " # resume_from_checkpoint=\"./gpt2-evy/checkpoint-1900\"\n",
2001
+ ")\n",
2002
+ "\n",
2003
+ "trainer = Trainer(\n",
2004
+ " model=model,\n",
2005
+ " args=training_args,\n",
2006
+ " train_dataset=train_data,\n",
2007
+ " eval_dataset=val_data,\n",
2008
+ " tokenizer=tokenizer\n",
2009
+ ")\n",
2010
+ "\n",
2011
+ "trainer.train()"
2012
+ ],
2013
+ "metadata": {
2014
+ "colab": {
2015
+ "base_uri": "https://localhost:8080/",
2016
+ "height": 756
2017
+ },
2018
+ "id": "VQuBHSec_hjO",
2019
+ "outputId": "8d1db759-c959-4181-f258-abf486c22d0b"
2020
+ },
2021
+ "execution_count": 36,
2022
+ "outputs": [
2023
+ {
2024
+ "output_type": "display_data",
2025
+ "data": {
2026
+ "text/plain": [
2027
+ "<IPython.core.display.HTML object>"
2028
+ ],
2029
+ "text/html": [
2030
+ "\n",
2031
+ " <div>\n",
2032
+ " \n",
2033
+ " <progress value='140' max='140' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
2034
+ " [140/140 00:38, Epoch 20/20]\n",
2035
+ " </div>\n",
2036
+ " <table border=\"1\" class=\"dataframe\">\n",
2037
+ " <thead>\n",
2038
+ " <tr style=\"text-align: left;\">\n",
2039
+ " <th>Epoch</th>\n",
2040
+ " <th>Training Loss</th>\n",
2041
+ " <th>Validation Loss</th>\n",
2042
+ " </tr>\n",
2043
+ " </thead>\n",
2044
+ " <tbody>\n",
2045
+ " <tr>\n",
2046
+ " <td>1</td>\n",
2047
+ " <td>No log</td>\n",
2048
+ " <td>1.553022</td>\n",
2049
+ " </tr>\n",
2050
+ " <tr>\n",
2051
+ " <td>2</td>\n",
2052
+ " <td>No log</td>\n",
2053
+ " <td>1.460105</td>\n",
2054
+ " </tr>\n",
2055
+ " <tr>\n",
2056
+ " <td>3</td>\n",
2057
+ " <td>No log</td>\n",
2058
+ " <td>1.395301</td>\n",
2059
+ " </tr>\n",
2060
+ " <tr>\n",
2061
+ " <td>4</td>\n",
2062
+ " <td>No log</td>\n",
2063
+ " <td>1.355699</td>\n",
2064
+ " </tr>\n",
2065
+ " <tr>\n",
2066
+ " <td>5</td>\n",
2067
+ " <td>No log</td>\n",
2068
+ " <td>1.330109</td>\n",
2069
+ " </tr>\n",
2070
+ " <tr>\n",
2071
+ " <td>6</td>\n",
2072
+ " <td>No log</td>\n",
2073
+ " <td>1.311717</td>\n",
2074
+ " </tr>\n",
2075
+ " <tr>\n",
2076
+ " <td>7</td>\n",
2077
+ " <td>No log</td>\n",
2078
+ " <td>1.296761</td>\n",
2079
+ " </tr>\n",
2080
+ " <tr>\n",
2081
+ " <td>8</td>\n",
2082
+ " <td>No log</td>\n",
2083
+ " <td>1.283209</td>\n",
2084
+ " </tr>\n",
2085
+ " <tr>\n",
2086
+ " <td>9</td>\n",
2087
+ " <td>No log</td>\n",
2088
+ " <td>1.276882</td>\n",
2089
+ " </tr>\n",
2090
+ " <tr>\n",
2091
+ " <td>10</td>\n",
2092
+ " <td>No log</td>\n",
2093
+ " <td>1.280680</td>\n",
2094
+ " </tr>\n",
2095
+ " <tr>\n",
2096
+ " <td>11</td>\n",
2097
+ " <td>No log</td>\n",
2098
+ " <td>1.269814</td>\n",
2099
+ " </tr>\n",
2100
+ " <tr>\n",
2101
+ " <td>12</td>\n",
2102
+ " <td>No log</td>\n",
2103
+ " <td>1.270706</td>\n",
2104
+ " </tr>\n",
2105
+ " <tr>\n",
2106
+ " <td>13</td>\n",
2107
+ " <td>No log</td>\n",
2108
+ " <td>1.274694</td>\n",
2109
+ " </tr>\n",
2110
+ " <tr>\n",
2111
+ " <td>14</td>\n",
2112
+ " <td>No log</td>\n",
2113
+ " <td>1.269452</td>\n",
2114
+ " </tr>\n",
2115
+ " <tr>\n",
2116
+ " <td>15</td>\n",
2117
+ " <td>1.055700</td>\n",
2118
+ " <td>1.269921</td>\n",
2119
+ " </tr>\n",
2120
+ " <tr>\n",
2121
+ " <td>16</td>\n",
2122
+ " <td>1.055700</td>\n",
2123
+ " <td>1.265592</td>\n",
2124
+ " </tr>\n",
2125
+ " <tr>\n",
2126
+ " <td>17</td>\n",
2127
+ " <td>1.055700</td>\n",
2128
+ " <td>1.271150</td>\n",
2129
+ " </tr>\n",
2130
+ " <tr>\n",
2131
+ " <td>18</td>\n",
2132
+ " <td>1.055700</td>\n",
2133
+ " <td>1.269600</td>\n",
2134
+ " </tr>\n",
2135
+ " <tr>\n",
2136
+ " <td>19</td>\n",
2137
+ " <td>1.055700</td>\n",
2138
+ " <td>1.269069</td>\n",
2139
+ " </tr>\n",
2140
+ " <tr>\n",
2141
+ " <td>20</td>\n",
2142
+ " <td>1.055700</td>\n",
2143
+ " <td>1.269298</td>\n",
2144
+ " </tr>\n",
2145
+ " </tbody>\n",
2146
+ "</table><p>"
2147
+ ]
2148
+ },
2149
+ "metadata": {}
2150
+ },
2151
+ {
2152
+ "output_type": "execute_result",
2153
+ "data": {
2154
+ "text/plain": [
2155
+ "TrainOutput(global_step=140, training_loss=0.9502299581255231, metrics={'train_runtime': 38.6687, 'train_samples_per_second': 27.93, 'train_steps_per_second': 3.621, 'total_flos': 282195394560000.0, 'train_loss': 0.9502299581255231, 'epoch': 20.0})"
2156
+ ]
2157
+ },
2158
+ "metadata": {},
2159
+ "execution_count": 36
2160
+ }
2161
+ ]
2162
+ },
2163
+ {
2164
+ "cell_type": "markdown",
2165
+ "source": [
2166
+ "# Save Model"
2167
+ ],
2168
+ "metadata": {
2169
+ "id": "9RkdIyRfLNkW"
2170
+ }
2171
+ },
2172
+ {
2173
+ "cell_type": "code",
2174
+ "source": [
2175
+ "trainer.save_model()\n",
2176
+ "trainer.push_to_hub()\n",
2177
+ "tokenizer.push_to_hub(\"gpt2-evy\")"
2178
+ ],
2179
+ "metadata": {
2180
+ "id": "Mp0hvvAILPlQ",
2181
+ "colab": {
2182
+ "base_uri": "https://localhost:8080/",
2183
+ "height": 152,
2184
+ "referenced_widgets": [
2185
+ "f403a8090a6646a5b24bd3f1a482a466",
2186
+ "7c5e45acf4f44fbbbe42ba6ae0d1a00b",
2187
+ "241d22a572d14deeb99cf23d32b15437",
2188
+ "833282adf0374866a2e923ba2d89ed54",
2189
+ "92893ea5925a416496dbb5f0f6cc5fe4",
2190
+ "b965c7efbf2c4bb59f6d6339bca638aa",
2191
+ "8543bc719912446a956bc1df364892dc",
2192
+ "7df787a07b5442cf9995c0e239c65c25",
2193
+ "1b93b372a091455b90d7aee81706868d",
2194
+ "dccf8ecf30d94f3ca449bf2f681683c7",
2195
+ "0ffd8ed4d4e84c2eae4837978e6dfdcf",
2196
+ "1a8e5de3f44b4deb9815fe7dcac10f71",
2197
+ "15f90e6de63647a291899befc0912db8",
2198
+ "288e7c00f27b421388f23f1255d01f2d",
2199
+ "f57174571a494c4cb2074a904f3b86ce",
2200
+ "8eb37b23513e49679dd5f12554a66295",
2201
+ "de0b0d803dde4c8fa8bcd9eda5210420",
2202
+ "3be10b8fc42749fdb522f3168952b3ea",
2203
+ "d2895d4001b24dc6bc52f8ead03f77a3",
2204
+ "99962b09abe44dc7977f067371cf65ef",
2205
+ "e1434108affa47fa94b2680e72319099",
2206
+ "91d6a93bbb374189be6d6b8a62c8ab9b"
2207
+ ]
2208
+ },
2209
+ "outputId": "4b296348-4bf4-440d-eb74-219e15b5e032"
2210
+ },
2211
+ "execution_count": 37,
2212
+ "outputs": [
2213
+ {
2214
+ "output_type": "display_data",
2215
+ "data": {
2216
+ "text/plain": [
2217
+ "model.safetensors: 0%| | 0.00/498M [00:00<?, ?B/s]"
2218
+ ],
2219
+ "application/vnd.jupyter.widget-view+json": {
2220
+ "version_major": 2,
2221
+ "version_minor": 0,
2222
+ "model_id": "f403a8090a6646a5b24bd3f1a482a466"
2223
+ }
2224
+ },
2225
+ "metadata": {}
2226
+ },
2227
+ {
2228
+ "output_type": "display_data",
2229
+ "data": {
2230
+ "text/plain": [
2231
+ "README.md: 0%| | 0.00/2.19k [00:00<?, ?B/s]"
2232
+ ],
2233
+ "application/vnd.jupyter.widget-view+json": {
2234
+ "version_major": 2,
2235
+ "version_minor": 0,
2236
+ "model_id": "1a8e5de3f44b4deb9815fe7dcac10f71"
2237
+ }
2238
+ },
2239
+ "metadata": {}
2240
+ },
2241
+ {
2242
+ "output_type": "execute_result",
2243
+ "data": {
2244
+ "text/plain": [
2245
+ "CommitInfo(commit_url='https://huggingface.co/joshcarp/gpt2-evy/commit/c95869e260cd381e108a4f2ad1c6f3745a001a68', commit_message='Upload tokenizer', commit_description='', oid='c95869e260cd381e108a4f2ad1c6f3745a001a68', pr_url=None, pr_revision=None, pr_num=None)"
2246
+ ],
2247
+ "application/vnd.google.colaboratory.intrinsic+json": {
2248
+ "type": "string"
2249
+ }
2250
+ },
2251
+ "metadata": {},
2252
+ "execution_count": 37
2253
+ }
2254
+ ]
2255
+ }
2256
+ ]
2257
+ }