eremeev-d commited on
Commit
bc45729
·
1 Parent(s): 832fef5

Added notebooks

Browse files
Notebooks/ysda-ml-02-05-build-index.ipynb ADDED
@@ -0,0 +1,556 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "code",
5
+ "execution_count": 1,
6
+ "id": "0bb77379",
7
+ "metadata": {
8
+ "execution": {
9
+ "iopub.execute_input": "2023-04-17T05:48:17.537446Z",
10
+ "iopub.status.busy": "2023-04-17T05:48:17.536424Z",
11
+ "iopub.status.idle": "2023-04-17T05:48:31.651358Z",
12
+ "shell.execute_reply": "2023-04-17T05:48:31.649651Z"
13
+ },
14
+ "papermill": {
15
+ "duration": 14.123673,
16
+ "end_time": "2023-04-17T05:48:31.654609",
17
+ "exception": false,
18
+ "start_time": "2023-04-17T05:48:17.530936",
19
+ "status": "completed"
20
+ },
21
+ "tags": []
22
+ },
23
+ "outputs": [
24
+ {
25
+ "name": "stdout",
26
+ "output_type": "stream",
27
+ "text": [
28
+ "Collecting faiss-cpu\r\n",
29
+ " Downloading faiss_cpu-1.7.3-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (17.0 MB)\r\n",
30
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m17.0/17.0 MB\u001b[0m \u001b[31m42.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\r\n",
31
+ "\u001b[?25hInstalling collected packages: faiss-cpu\r\n",
32
+ "Successfully installed faiss-cpu-1.7.3\r\n",
33
+ "\u001b[33mWARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\u001b[0m\u001b[33m\r\n",
34
+ "\u001b[0m"
35
+ ]
36
+ }
37
+ ],
38
+ "source": [
39
+ "!pip install faiss-cpu"
40
+ ]
41
+ },
42
+ {
43
+ "cell_type": "code",
44
+ "execution_count": 2,
45
+ "id": "3c9019a6",
46
+ "metadata": {
47
+ "execution": {
48
+ "iopub.execute_input": "2023-04-17T05:48:31.663539Z",
49
+ "iopub.status.busy": "2023-04-17T05:48:31.662590Z",
50
+ "iopub.status.idle": "2023-04-17T05:48:32.984952Z",
51
+ "shell.execute_reply": "2023-04-17T05:48:32.983413Z"
52
+ },
53
+ "papermill": {
54
+ "duration": 1.330221,
55
+ "end_time": "2023-04-17T05:48:32.988111",
56
+ "exception": false,
57
+ "start_time": "2023-04-17T05:48:31.657890",
58
+ "status": "completed"
59
+ },
60
+ "tags": []
61
+ },
62
+ "outputs": [],
63
+ "source": [
64
+ "import datasets\n",
65
+ "from datasets import Dataset\n",
66
+ "import numpy as np\n",
67
+ "import json\n",
68
+ "import os\n",
69
+ "from tqdm.notebook import tqdm as tqdm\n",
70
+ "import faiss\n",
71
+ "\n",
72
+ "ARTICLES_PATH = '/kaggle/input/ysda-ml-02-05-process-json/articles.hf'\n",
73
+ "EMBEDDINGS_PATH = '/kaggle/input/ysda-ml-02-05-generate-embeddings/embeddings.npy'\n",
74
+ "OUTPUT_PATH = '/kaggle/working/articles.index'"
75
+ ]
76
+ },
77
+ {
78
+ "cell_type": "code",
79
+ "execution_count": 3,
80
+ "id": "0271d205",
81
+ "metadata": {
82
+ "execution": {
83
+ "iopub.execute_input": "2023-04-17T05:48:32.997788Z",
84
+ "iopub.status.busy": "2023-04-17T05:48:32.996997Z",
85
+ "iopub.status.idle": "2023-04-17T05:48:47.446365Z",
86
+ "shell.execute_reply": "2023-04-17T05:48:47.445122Z"
87
+ },
88
+ "papermill": {
89
+ "duration": 14.457709,
90
+ "end_time": "2023-04-17T05:48:47.449394",
91
+ "exception": false,
92
+ "start_time": "2023-04-17T05:48:32.991685",
93
+ "status": "completed"
94
+ },
95
+ "tags": []
96
+ },
97
+ "outputs": [],
98
+ "source": [
99
+ "articles = Dataset.load_from_disk(ARTICLES_PATH)\n",
100
+ "embeddings = np.load(EMBEDDINGS_PATH)"
101
+ ]
102
+ },
103
+ {
104
+ "cell_type": "code",
105
+ "execution_count": 4,
106
+ "id": "7467da22",
107
+ "metadata": {
108
+ "execution": {
109
+ "iopub.execute_input": "2023-04-17T05:48:47.458217Z",
110
+ "iopub.status.busy": "2023-04-17T05:48:47.457678Z",
111
+ "iopub.status.idle": "2023-04-17T05:49:05.400026Z",
112
+ "shell.execute_reply": "2023-04-17T05:49:05.398641Z"
113
+ },
114
+ "papermill": {
115
+ "duration": 17.95023,
116
+ "end_time": "2023-04-17T05:49:05.402995",
117
+ "exception": false,
118
+ "start_time": "2023-04-17T05:48:47.452765",
119
+ "status": "completed"
120
+ },
121
+ "tags": []
122
+ },
123
+ "outputs": [
124
+ {
125
+ "data": {
126
+ "application/vnd.jupyter.widget-view+json": {
127
+ "model_id": "df6dfb9da874419d9783f7f156cd9963",
128
+ "version_major": 2,
129
+ "version_minor": 0
130
+ },
131
+ "text/plain": [
132
+ " 0%| | 0/2239 [00:00<?, ?it/s]"
133
+ ]
134
+ },
135
+ "metadata": {},
136
+ "output_type": "display_data"
137
+ }
138
+ ],
139
+ "source": [
140
+ "articles.add_faiss_index_from_external_arrays(\n",
141
+ " embeddings, \n",
142
+ " 'embedding', \n",
143
+ " metric_type=faiss.METRIC_INNER_PRODUCT\n",
144
+ ")"
145
+ ]
146
+ },
147
+ {
148
+ "cell_type": "code",
149
+ "execution_count": 5,
150
+ "id": "61bb1bd4",
151
+ "metadata": {
152
+ "execution": {
153
+ "iopub.execute_input": "2023-04-17T05:49:05.412042Z",
154
+ "iopub.status.busy": "2023-04-17T05:49:05.411098Z",
155
+ "iopub.status.idle": "2023-04-17T05:49:08.841963Z",
156
+ "shell.execute_reply": "2023-04-17T05:49:08.840974Z"
157
+ },
158
+ "papermill": {
159
+ "duration": 3.438676,
160
+ "end_time": "2023-04-17T05:49:08.845080",
161
+ "exception": false,
162
+ "start_time": "2023-04-17T05:49:05.406404",
163
+ "status": "completed"
164
+ },
165
+ "tags": []
166
+ },
167
+ "outputs": [],
168
+ "source": [
169
+ "articles.save_faiss_index('embedding', OUTPUT_PATH)"
170
+ ]
171
+ }
172
+ ],
173
+ "metadata": {
174
+ "kernelspec": {
175
+ "display_name": "Python 3",
176
+ "language": "python",
177
+ "name": "python3"
178
+ },
179
+ "language_info": {
180
+ "codemirror_mode": {
181
+ "name": "ipython",
182
+ "version": 3
183
+ },
184
+ "file_extension": ".py",
185
+ "mimetype": "text/x-python",
186
+ "name": "python",
187
+ "nbconvert_exporter": "python",
188
+ "pygments_lexer": "ipython3",
189
+ "version": "3.7.12"
190
+ },
191
+ "papermill": {
192
+ "default_parameters": {},
193
+ "duration": 63.431822,
194
+ "end_time": "2023-04-17T05:49:09.990990",
195
+ "environment_variables": {},
196
+ "exception": null,
197
+ "input_path": "__notebook__.ipynb",
198
+ "output_path": "__notebook__.ipynb",
199
+ "parameters": {},
200
+ "start_time": "2023-04-17T05:48:06.559168",
201
+ "version": "2.4.0"
202
+ },
203
+ "widgets": {
204
+ "application/vnd.jupyter.widget-state+json": {
205
+ "state": {
206
+ "0814242ff41d45b295efc66b88f34057": {
207
+ "model_module": "@jupyter-widgets/controls",
208
+ "model_module_version": "1.5.0",
209
+ "model_name": "HTMLModel",
210
+ "state": {
211
+ "_dom_classes": [],
212
+ "_model_module": "@jupyter-widgets/controls",
213
+ "_model_module_version": "1.5.0",
214
+ "_model_name": "HTMLModel",
215
+ "_view_count": null,
216
+ "_view_module": "@jupyter-widgets/controls",
217
+ "_view_module_version": "1.5.0",
218
+ "_view_name": "HTMLView",
219
+ "description": "",
220
+ "description_tooltip": null,
221
+ "layout": "IPY_MODEL_a317d1fc94a34dc6a569ef9655c2c5e6",
222
+ "placeholder": "​",
223
+ "style": "IPY_MODEL_0d730835a72d403f82a5c216ad4d13b4",
224
+ "value": " 2239/2239 [00:13&lt;00:00, 71.44it/s]"
225
+ }
226
+ },
227
+ "0d730835a72d403f82a5c216ad4d13b4": {
228
+ "model_module": "@jupyter-widgets/controls",
229
+ "model_module_version": "1.5.0",
230
+ "model_name": "DescriptionStyleModel",
231
+ "state": {
232
+ "_model_module": "@jupyter-widgets/controls",
233
+ "_model_module_version": "1.5.0",
234
+ "_model_name": "DescriptionStyleModel",
235
+ "_view_count": null,
236
+ "_view_module": "@jupyter-widgets/base",
237
+ "_view_module_version": "1.2.0",
238
+ "_view_name": "StyleView",
239
+ "description_width": ""
240
+ }
241
+ },
242
+ "16076bcc1f6644889fc4f2e3fce8bd88": {
243
+ "model_module": "@jupyter-widgets/controls",
244
+ "model_module_version": "1.5.0",
245
+ "model_name": "HTMLModel",
246
+ "state": {
247
+ "_dom_classes": [],
248
+ "_model_module": "@jupyter-widgets/controls",
249
+ "_model_module_version": "1.5.0",
250
+ "_model_name": "HTMLModel",
251
+ "_view_count": null,
252
+ "_view_module": "@jupyter-widgets/controls",
253
+ "_view_module_version": "1.5.0",
254
+ "_view_name": "HTMLView",
255
+ "description": "",
256
+ "description_tooltip": null,
257
+ "layout": "IPY_MODEL_21235b1f64e1452fa06a37afc94e37df",
258
+ "placeholder": "​",
259
+ "style": "IPY_MODEL_168f36f0d10a46d1b7e635237f18d601",
260
+ "value": "100%"
261
+ }
262
+ },
263
+ "168f36f0d10a46d1b7e635237f18d601": {
264
+ "model_module": "@jupyter-widgets/controls",
265
+ "model_module_version": "1.5.0",
266
+ "model_name": "DescriptionStyleModel",
267
+ "state": {
268
+ "_model_module": "@jupyter-widgets/controls",
269
+ "_model_module_version": "1.5.0",
270
+ "_model_name": "DescriptionStyleModel",
271
+ "_view_count": null,
272
+ "_view_module": "@jupyter-widgets/base",
273
+ "_view_module_version": "1.2.0",
274
+ "_view_name": "StyleView",
275
+ "description_width": ""
276
+ }
277
+ },
278
+ "1a5ebfbcfaa34421aa36d8139763c641": {
279
+ "model_module": "@jupyter-widgets/base",
280
+ "model_module_version": "1.2.0",
281
+ "model_name": "LayoutModel",
282
+ "state": {
283
+ "_model_module": "@jupyter-widgets/base",
284
+ "_model_module_version": "1.2.0",
285
+ "_model_name": "LayoutModel",
286
+ "_view_count": null,
287
+ "_view_module": "@jupyter-widgets/base",
288
+ "_view_module_version": "1.2.0",
289
+ "_view_name": "LayoutView",
290
+ "align_content": null,
291
+ "align_items": null,
292
+ "align_self": null,
293
+ "border": null,
294
+ "bottom": null,
295
+ "display": null,
296
+ "flex": null,
297
+ "flex_flow": null,
298
+ "grid_area": null,
299
+ "grid_auto_columns": null,
300
+ "grid_auto_flow": null,
301
+ "grid_auto_rows": null,
302
+ "grid_column": null,
303
+ "grid_gap": null,
304
+ "grid_row": null,
305
+ "grid_template_areas": null,
306
+ "grid_template_columns": null,
307
+ "grid_template_rows": null,
308
+ "height": null,
309
+ "justify_content": null,
310
+ "justify_items": null,
311
+ "left": null,
312
+ "margin": null,
313
+ "max_height": null,
314
+ "max_width": null,
315
+ "min_height": null,
316
+ "min_width": null,
317
+ "object_fit": null,
318
+ "object_position": null,
319
+ "order": null,
320
+ "overflow": null,
321
+ "overflow_x": null,
322
+ "overflow_y": null,
323
+ "padding": null,
324
+ "right": null,
325
+ "top": null,
326
+ "visibility": null,
327
+ "width": null
328
+ }
329
+ },
330
+ "21235b1f64e1452fa06a37afc94e37df": {
331
+ "model_module": "@jupyter-widgets/base",
332
+ "model_module_version": "1.2.0",
333
+ "model_name": "LayoutModel",
334
+ "state": {
335
+ "_model_module": "@jupyter-widgets/base",
336
+ "_model_module_version": "1.2.0",
337
+ "_model_name": "LayoutModel",
338
+ "_view_count": null,
339
+ "_view_module": "@jupyter-widgets/base",
340
+ "_view_module_version": "1.2.0",
341
+ "_view_name": "LayoutView",
342
+ "align_content": null,
343
+ "align_items": null,
344
+ "align_self": null,
345
+ "border": null,
346
+ "bottom": null,
347
+ "display": null,
348
+ "flex": null,
349
+ "flex_flow": null,
350
+ "grid_area": null,
351
+ "grid_auto_columns": null,
352
+ "grid_auto_flow": null,
353
+ "grid_auto_rows": null,
354
+ "grid_column": null,
355
+ "grid_gap": null,
356
+ "grid_row": null,
357
+ "grid_template_areas": null,
358
+ "grid_template_columns": null,
359
+ "grid_template_rows": null,
360
+ "height": null,
361
+ "justify_content": null,
362
+ "justify_items": null,
363
+ "left": null,
364
+ "margin": null,
365
+ "max_height": null,
366
+ "max_width": null,
367
+ "min_height": null,
368
+ "min_width": null,
369
+ "object_fit": null,
370
+ "object_position": null,
371
+ "order": null,
372
+ "overflow": null,
373
+ "overflow_x": null,
374
+ "overflow_y": null,
375
+ "padding": null,
376
+ "right": null,
377
+ "top": null,
378
+ "visibility": null,
379
+ "width": null
380
+ }
381
+ },
382
+ "6c34fbcfee584e5a840c617c8be1dd62": {
383
+ "model_module": "@jupyter-widgets/controls",
384
+ "model_module_version": "1.5.0",
385
+ "model_name": "FloatProgressModel",
386
+ "state": {
387
+ "_dom_classes": [],
388
+ "_model_module": "@jupyter-widgets/controls",
389
+ "_model_module_version": "1.5.0",
390
+ "_model_name": "FloatProgressModel",
391
+ "_view_count": null,
392
+ "_view_module": "@jupyter-widgets/controls",
393
+ "_view_module_version": "1.5.0",
394
+ "_view_name": "ProgressView",
395
+ "bar_style": "success",
396
+ "description": "",
397
+ "description_tooltip": null,
398
+ "layout": "IPY_MODEL_a0f7c5c2d54945458130ff18c60a4f3b",
399
+ "max": 2239.0,
400
+ "min": 0.0,
401
+ "orientation": "horizontal",
402
+ "style": "IPY_MODEL_8cf935e4c2f24f77a45173536fa142a7",
403
+ "value": 2239.0
404
+ }
405
+ },
406
+ "8cf935e4c2f24f77a45173536fa142a7": {
407
+ "model_module": "@jupyter-widgets/controls",
408
+ "model_module_version": "1.5.0",
409
+ "model_name": "ProgressStyleModel",
410
+ "state": {
411
+ "_model_module": "@jupyter-widgets/controls",
412
+ "_model_module_version": "1.5.0",
413
+ "_model_name": "ProgressStyleModel",
414
+ "_view_count": null,
415
+ "_view_module": "@jupyter-widgets/base",
416
+ "_view_module_version": "1.2.0",
417
+ "_view_name": "StyleView",
418
+ "bar_color": null,
419
+ "description_width": ""
420
+ }
421
+ },
422
+ "a0f7c5c2d54945458130ff18c60a4f3b": {
423
+ "model_module": "@jupyter-widgets/base",
424
+ "model_module_version": "1.2.0",
425
+ "model_name": "LayoutModel",
426
+ "state": {
427
+ "_model_module": "@jupyter-widgets/base",
428
+ "_model_module_version": "1.2.0",
429
+ "_model_name": "LayoutModel",
430
+ "_view_count": null,
431
+ "_view_module": "@jupyter-widgets/base",
432
+ "_view_module_version": "1.2.0",
433
+ "_view_name": "LayoutView",
434
+ "align_content": null,
435
+ "align_items": null,
436
+ "align_self": null,
437
+ "border": null,
438
+ "bottom": null,
439
+ "display": null,
440
+ "flex": null,
441
+ "flex_flow": null,
442
+ "grid_area": null,
443
+ "grid_auto_columns": null,
444
+ "grid_auto_flow": null,
445
+ "grid_auto_rows": null,
446
+ "grid_column": null,
447
+ "grid_gap": null,
448
+ "grid_row": null,
449
+ "grid_template_areas": null,
450
+ "grid_template_columns": null,
451
+ "grid_template_rows": null,
452
+ "height": null,
453
+ "justify_content": null,
454
+ "justify_items": null,
455
+ "left": null,
456
+ "margin": null,
457
+ "max_height": null,
458
+ "max_width": null,
459
+ "min_height": null,
460
+ "min_width": null,
461
+ "object_fit": null,
462
+ "object_position": null,
463
+ "order": null,
464
+ "overflow": null,
465
+ "overflow_x": null,
466
+ "overflow_y": null,
467
+ "padding": null,
468
+ "right": null,
469
+ "top": null,
470
+ "visibility": null,
471
+ "width": null
472
+ }
473
+ },
474
+ "a317d1fc94a34dc6a569ef9655c2c5e6": {
475
+ "model_module": "@jupyter-widgets/base",
476
+ "model_module_version": "1.2.0",
477
+ "model_name": "LayoutModel",
478
+ "state": {
479
+ "_model_module": "@jupyter-widgets/base",
480
+ "_model_module_version": "1.2.0",
481
+ "_model_name": "LayoutModel",
482
+ "_view_count": null,
483
+ "_view_module": "@jupyter-widgets/base",
484
+ "_view_module_version": "1.2.0",
485
+ "_view_name": "LayoutView",
486
+ "align_content": null,
487
+ "align_items": null,
488
+ "align_self": null,
489
+ "border": null,
490
+ "bottom": null,
491
+ "display": null,
492
+ "flex": null,
493
+ "flex_flow": null,
494
+ "grid_area": null,
495
+ "grid_auto_columns": null,
496
+ "grid_auto_flow": null,
497
+ "grid_auto_rows": null,
498
+ "grid_column": null,
499
+ "grid_gap": null,
500
+ "grid_row": null,
501
+ "grid_template_areas": null,
502
+ "grid_template_columns": null,
503
+ "grid_template_rows": null,
504
+ "height": null,
505
+ "justify_content": null,
506
+ "justify_items": null,
507
+ "left": null,
508
+ "margin": null,
509
+ "max_height": null,
510
+ "max_width": null,
511
+ "min_height": null,
512
+ "min_width": null,
513
+ "object_fit": null,
514
+ "object_position": null,
515
+ "order": null,
516
+ "overflow": null,
517
+ "overflow_x": null,
518
+ "overflow_y": null,
519
+ "padding": null,
520
+ "right": null,
521
+ "top": null,
522
+ "visibility": null,
523
+ "width": null
524
+ }
525
+ },
526
+ "df6dfb9da874419d9783f7f156cd9963": {
527
+ "model_module": "@jupyter-widgets/controls",
528
+ "model_module_version": "1.5.0",
529
+ "model_name": "HBoxModel",
530
+ "state": {
531
+ "_dom_classes": [],
532
+ "_model_module": "@jupyter-widgets/controls",
533
+ "_model_module_version": "1.5.0",
534
+ "_model_name": "HBoxModel",
535
+ "_view_count": null,
536
+ "_view_module": "@jupyter-widgets/controls",
537
+ "_view_module_version": "1.5.0",
538
+ "_view_name": "HBoxView",
539
+ "box_style": "",
540
+ "children": [
541
+ "IPY_MODEL_16076bcc1f6644889fc4f2e3fce8bd88",
542
+ "IPY_MODEL_6c34fbcfee584e5a840c617c8be1dd62",
543
+ "IPY_MODEL_0814242ff41d45b295efc66b88f34057"
544
+ ],
545
+ "layout": "IPY_MODEL_1a5ebfbcfaa34421aa36d8139763c641"
546
+ }
547
+ }
548
+ },
549
+ "version_major": 2,
550
+ "version_minor": 0
551
+ }
552
+ }
553
+ },
554
+ "nbformat": 4,
555
+ "nbformat_minor": 5
556
+ }
Notebooks/ysda-ml-02-05-finetune.ipynb ADDED
The diff for this file is too large to render. See raw diff
 
Notebooks/ysda-ml-02-05-generate-embeddings.ipynb ADDED
@@ -0,0 +1,2681 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "code",
5
+ "execution_count": 1,
6
+ "id": "5247856b",
7
+ "metadata": {
8
+ "_cell_guid": "b1076dfc-b9ad-4769-8c92-a6c4dae69d19",
9
+ "_uuid": "8f2839f25d086af736a60e9eeb907d3b93b6e0e5",
10
+ "execution": {
11
+ "iopub.execute_input": "2023-04-16T22:13:19.965100Z",
12
+ "iopub.status.busy": "2023-04-16T22:13:19.964059Z",
13
+ "iopub.status.idle": "2023-04-16T22:13:24.741753Z",
14
+ "shell.execute_reply": "2023-04-16T22:13:24.740665Z"
15
+ },
16
+ "papermill": {
17
+ "duration": 4.784228,
18
+ "end_time": "2023-04-16T22:13:24.744315",
19
+ "exception": false,
20
+ "start_time": "2023-04-16T22:13:19.960087",
21
+ "status": "completed"
22
+ },
23
+ "tags": []
24
+ },
25
+ "outputs": [],
26
+ "source": [
27
+ "import datasets\n",
28
+ "from datasets import Dataset\n",
29
+ "import numpy as np\n",
30
+ "import json\n",
31
+ "import os\n",
32
+ "from transformers import AutoTokenizer, AutoModel\n",
33
+ "import torch\n",
34
+ "import torch.nn.functional as F\n",
35
+ "from tqdm.notebook import tqdm as tqdm\n",
36
+ "\n",
37
+ "ARTICLES_PATH = '/kaggle/input/ysda-ml-02-05-process-json/articles.hf'\n",
38
+ "OUTPUT_PATH = '/kaggle/working/embeddings.npy'"
39
+ ]
40
+ },
41
+ {
42
+ "cell_type": "code",
43
+ "execution_count": 2,
44
+ "id": "e843dcbc",
45
+ "metadata": {
46
+ "execution": {
47
+ "iopub.execute_input": "2023-04-16T22:13:24.750354Z",
48
+ "iopub.status.busy": "2023-04-16T22:13:24.749123Z",
49
+ "iopub.status.idle": "2023-04-16T22:13:31.724234Z",
50
+ "shell.execute_reply": "2023-04-16T22:13:31.723052Z"
51
+ },
52
+ "papermill": {
53
+ "duration": 6.980451,
54
+ "end_time": "2023-04-16T22:13:31.726848",
55
+ "exception": false,
56
+ "start_time": "2023-04-16T22:13:24.746397",
57
+ "status": "completed"
58
+ },
59
+ "tags": []
60
+ },
61
+ "outputs": [
62
+ {
63
+ "data": {
64
+ "application/vnd.jupyter.widget-view+json": {
65
+ "model_id": "bf7e94fe0aba40cea4d15a6f598be1ea",
66
+ "version_major": 2,
67
+ "version_minor": 0
68
+ },
69
+ "text/plain": [
70
+ "Downloading (…)okenizer_config.json: 0%| | 0.00/350 [00:00<?, ?B/s]"
71
+ ]
72
+ },
73
+ "metadata": {},
74
+ "output_type": "display_data"
75
+ },
76
+ {
77
+ "data": {
78
+ "application/vnd.jupyter.widget-view+json": {
79
+ "model_id": "d450a5a84ea04020a24228c4acd81696",
80
+ "version_major": 2,
81
+ "version_minor": 0
82
+ },
83
+ "text/plain": [
84
+ "Downloading (…)solve/main/vocab.txt: 0%| | 0.00/232k [00:00<?, ?B/s]"
85
+ ]
86
+ },
87
+ "metadata": {},
88
+ "output_type": "display_data"
89
+ },
90
+ {
91
+ "data": {
92
+ "application/vnd.jupyter.widget-view+json": {
93
+ "model_id": "bb422963eb084ec783bfcf190950a2f0",
94
+ "version_major": 2,
95
+ "version_minor": 0
96
+ },
97
+ "text/plain": [
98
+ "Downloading (…)/main/tokenizer.json: 0%| | 0.00/466k [00:00<?, ?B/s]"
99
+ ]
100
+ },
101
+ "metadata": {},
102
+ "output_type": "display_data"
103
+ },
104
+ {
105
+ "data": {
106
+ "application/vnd.jupyter.widget-view+json": {
107
+ "model_id": "7876aff2f3d24a53af0c20e4d6ba1c94",
108
+ "version_major": 2,
109
+ "version_minor": 0
110
+ },
111
+ "text/plain": [
112
+ "Downloading (…)cial_tokens_map.json: 0%| | 0.00/112 [00:00<?, ?B/s]"
113
+ ]
114
+ },
115
+ "metadata": {},
116
+ "output_type": "display_data"
117
+ },
118
+ {
119
+ "data": {
120
+ "application/vnd.jupyter.widget-view+json": {
121
+ "model_id": "03a375ebd135477487e4ebbf003e3308",
122
+ "version_major": 2,
123
+ "version_minor": 0
124
+ },
125
+ "text/plain": [
126
+ "Downloading (…)lve/main/config.json: 0%| | 0.00/612 [00:00<?, ?B/s]"
127
+ ]
128
+ },
129
+ "metadata": {},
130
+ "output_type": "display_data"
131
+ },
132
+ {
133
+ "data": {
134
+ "application/vnd.jupyter.widget-view+json": {
135
+ "model_id": "1246cc73517b40b9825c90feb26d9f52",
136
+ "version_major": 2,
137
+ "version_minor": 0
138
+ },
139
+ "text/plain": [
140
+ "Downloading pytorch_model.bin: 0%| | 0.00/90.9M [00:00<?, ?B/s]"
141
+ ]
142
+ },
143
+ "metadata": {},
144
+ "output_type": "display_data"
145
+ }
146
+ ],
147
+ "source": [
148
+ "device = torch.device('cuda:0')\n",
149
+ "tokenizer = AutoTokenizer.from_pretrained('sentence-transformers/all-MiniLM-L6-v2')\n",
150
+ "model = AutoModel.from_pretrained('sentence-transformers/all-MiniLM-L6-v2').to(device)"
151
+ ]
152
+ },
153
+ {
154
+ "cell_type": "code",
155
+ "execution_count": 3,
156
+ "id": "0939de26",
157
+ "metadata": {
158
+ "execution": {
159
+ "iopub.execute_input": "2023-04-16T22:13:31.734282Z",
160
+ "iopub.status.busy": "2023-04-16T22:13:31.733328Z",
161
+ "iopub.status.idle": "2023-04-16T22:13:31.743177Z",
162
+ "shell.execute_reply": "2023-04-16T22:13:31.742172Z"
163
+ },
164
+ "papermill": {
165
+ "duration": 0.015718,
166
+ "end_time": "2023-04-16T22:13:31.745331",
167
+ "exception": false,
168
+ "start_time": "2023-04-16T22:13:31.729613",
169
+ "status": "completed"
170
+ },
171
+ "tags": []
172
+ },
173
+ "outputs": [],
174
+ "source": [
175
+ "def mean_pooling(model_output, attention_mask):\n",
176
+ " token_embeddings = model_output[0]\n",
177
+ " input_mask_expanded = attention_mask.unsqueeze(-1) \\\n",
178
+ " .expand(token_embeddings.size()).float()\n",
179
+ " return torch.sum(token_embeddings * input_mask_expanded, 1) \\\n",
180
+ " / torch.clamp(input_mask_expanded.sum(1), min=1e-9)\n",
181
+ "\n",
182
+ "\n",
183
+ "def get_embedding(query, model, tokenizer):\n",
184
+ " encoded_input = tokenizer(\n",
185
+ " query, padding=True, truncation=True, return_tensors='pt'\n",
186
+ " ).to(device)\n",
187
+ " with torch.no_grad():\n",
188
+ " embeds = model(**encoded_input)\n",
189
+ " embeds = mean_pooling(embeds, encoded_input['attention_mask']).cpu()\n",
190
+ " embeds = F.normalize(embeds, p=2, dim=1)\n",
191
+ " return embeds.numpy().astype(np.float16)\n",
192
+ "\n",
193
+ "\n",
194
+ "def generate_embeddings(articles, batch_size):\n",
195
+ " embeddings = []\n",
196
+ " for batch in tqdm(range(0, len(articles['id']), batch_size)):\n",
197
+ " batch_abstracts = articles['abstract'][batch:batch+batch_size]\n",
198
+ " batch_embeddings = get_embedding(batch_abstracts, model, tokenizer)\n",
199
+ " embeddings.extend(list(batch_embeddings))\n",
200
+ " return embeddings"
201
+ ]
202
+ },
203
+ {
204
+ "cell_type": "code",
205
+ "execution_count": 4,
206
+ "id": "4f554901",
207
+ "metadata": {
208
+ "execution": {
209
+ "iopub.execute_input": "2023-04-16T22:13:31.751693Z",
210
+ "iopub.status.busy": "2023-04-16T22:13:31.751127Z",
211
+ "iopub.status.idle": "2023-04-17T00:38:19.371165Z",
212
+ "shell.execute_reply": "2023-04-17T00:38:19.369968Z"
213
+ },
214
+ "papermill": {
215
+ "duration": 8687.626574,
216
+ "end_time": "2023-04-17T00:38:19.374306",
217
+ "exception": false,
218
+ "start_time": "2023-04-16T22:13:31.747732",
219
+ "status": "completed"
220
+ },
221
+ "tags": []
222
+ },
223
+ "outputs": [
224
+ {
225
+ "data": {
226
+ "application/vnd.jupyter.widget-view+json": {
227
+ "model_id": "14127d5e851e4e77a15525d27f2ab349",
228
+ "version_major": 2,
229
+ "version_minor": 0
230
+ },
231
+ "text/plain": [
232
+ " 0%| | 0/17492 [00:00<?, ?it/s]"
233
+ ]
234
+ },
235
+ "metadata": {},
236
+ "output_type": "display_data"
237
+ }
238
+ ],
239
+ "source": [
240
+ "articles = Dataset.load_from_disk(ARTICLES_PATH).to_dict()\n",
241
+ "embeddings = generate_embeddings(articles, batch_size=128)\n",
242
+ "np.save(OUTPUT_PATH, embeddings)"
243
+ ]
244
+ }
245
+ ],
246
+ "metadata": {
247
+ "kernelspec": {
248
+ "display_name": "Python 3",
249
+ "language": "python",
250
+ "name": "python3"
251
+ },
252
+ "language_info": {
253
+ "codemirror_mode": {
254
+ "name": "ipython",
255
+ "version": 3
256
+ },
257
+ "file_extension": ".py",
258
+ "mimetype": "text/x-python",
259
+ "name": "python",
260
+ "nbconvert_exporter": "python",
261
+ "pygments_lexer": "ipython3",
262
+ "version": "3.7.12"
263
+ },
264
+ "papermill": {
265
+ "default_parameters": {},
266
+ "duration": 8712.753965,
267
+ "end_time": "2023-04-17T00:38:23.520517",
268
+ "environment_variables": {},
269
+ "exception": null,
270
+ "input_path": "__notebook__.ipynb",
271
+ "output_path": "__notebook__.ipynb",
272
+ "parameters": {},
273
+ "start_time": "2023-04-16T22:13:10.766552",
274
+ "version": "2.4.0"
275
+ },
276
+ "widgets": {
277
+ "application/vnd.jupyter.widget-state+json": {
278
+ "state": {
279
+ "015ee89d5e874c818cdaff8a2f05c22d": {
280
+ "model_module": "@jupyter-widgets/base",
281
+ "model_module_version": "1.2.0",
282
+ "model_name": "LayoutModel",
283
+ "state": {
284
+ "_model_module": "@jupyter-widgets/base",
285
+ "_model_module_version": "1.2.0",
286
+ "_model_name": "LayoutModel",
287
+ "_view_count": null,
288
+ "_view_module": "@jupyter-widgets/base",
289
+ "_view_module_version": "1.2.0",
290
+ "_view_name": "LayoutView",
291
+ "align_content": null,
292
+ "align_items": null,
293
+ "align_self": null,
294
+ "border": null,
295
+ "bottom": null,
296
+ "display": null,
297
+ "flex": null,
298
+ "flex_flow": null,
299
+ "grid_area": null,
300
+ "grid_auto_columns": null,
301
+ "grid_auto_flow": null,
302
+ "grid_auto_rows": null,
303
+ "grid_column": null,
304
+ "grid_gap": null,
305
+ "grid_row": null,
306
+ "grid_template_areas": null,
307
+ "grid_template_columns": null,
308
+ "grid_template_rows": null,
309
+ "height": null,
310
+ "justify_content": null,
311
+ "justify_items": null,
312
+ "left": null,
313
+ "margin": null,
314
+ "max_height": null,
315
+ "max_width": null,
316
+ "min_height": null,
317
+ "min_width": null,
318
+ "object_fit": null,
319
+ "object_position": null,
320
+ "order": null,
321
+ "overflow": null,
322
+ "overflow_x": null,
323
+ "overflow_y": null,
324
+ "padding": null,
325
+ "right": null,
326
+ "top": null,
327
+ "visibility": null,
328
+ "width": null
329
+ }
330
+ },
331
+ "03a375ebd135477487e4ebbf003e3308": {
332
+ "model_module": "@jupyter-widgets/controls",
333
+ "model_module_version": "1.5.0",
334
+ "model_name": "HBoxModel",
335
+ "state": {
336
+ "_dom_classes": [],
337
+ "_model_module": "@jupyter-widgets/controls",
338
+ "_model_module_version": "1.5.0",
339
+ "_model_name": "HBoxModel",
340
+ "_view_count": null,
341
+ "_view_module": "@jupyter-widgets/controls",
342
+ "_view_module_version": "1.5.0",
343
+ "_view_name": "HBoxView",
344
+ "box_style": "",
345
+ "children": [
346
+ "IPY_MODEL_7bbe332d901749c1ab35e01ead65b105",
347
+ "IPY_MODEL_e380ed94e29a4ceda0dee6b8da910a12",
348
+ "IPY_MODEL_6a4ad7e517e347d282b9e2674624b7e7"
349
+ ],
350
+ "layout": "IPY_MODEL_38e5a6017a5f43d088c9d62d46069ff6"
351
+ }
352
+ },
353
+ "04a4e4d8e06c4dc8a0220e79c81f48e3": {
354
+ "model_module": "@jupyter-widgets/base",
355
+ "model_module_version": "1.2.0",
356
+ "model_name": "LayoutModel",
357
+ "state": {
358
+ "_model_module": "@jupyter-widgets/base",
359
+ "_model_module_version": "1.2.0",
360
+ "_model_name": "LayoutModel",
361
+ "_view_count": null,
362
+ "_view_module": "@jupyter-widgets/base",
363
+ "_view_module_version": "1.2.0",
364
+ "_view_name": "LayoutView",
365
+ "align_content": null,
366
+ "align_items": null,
367
+ "align_self": null,
368
+ "border": null,
369
+ "bottom": null,
370
+ "display": null,
371
+ "flex": null,
372
+ "flex_flow": null,
373
+ "grid_area": null,
374
+ "grid_auto_columns": null,
375
+ "grid_auto_flow": null,
376
+ "grid_auto_rows": null,
377
+ "grid_column": null,
378
+ "grid_gap": null,
379
+ "grid_row": null,
380
+ "grid_template_areas": null,
381
+ "grid_template_columns": null,
382
+ "grid_template_rows": null,
383
+ "height": null,
384
+ "justify_content": null,
385
+ "justify_items": null,
386
+ "left": null,
387
+ "margin": null,
388
+ "max_height": null,
389
+ "max_width": null,
390
+ "min_height": null,
391
+ "min_width": null,
392
+ "object_fit": null,
393
+ "object_position": null,
394
+ "order": null,
395
+ "overflow": null,
396
+ "overflow_x": null,
397
+ "overflow_y": null,
398
+ "padding": null,
399
+ "right": null,
400
+ "top": null,
401
+ "visibility": null,
402
+ "width": null
403
+ }
404
+ },
405
+ "0703099941d34ae3a9477b7d8e741cc5": {
406
+ "model_module": "@jupyter-widgets/controls",
407
+ "model_module_version": "1.5.0",
408
+ "model_name": "FloatProgressModel",
409
+ "state": {
410
+ "_dom_classes": [],
411
+ "_model_module": "@jupyter-widgets/controls",
412
+ "_model_module_version": "1.5.0",
413
+ "_model_name": "FloatProgressModel",
414
+ "_view_count": null,
415
+ "_view_module": "@jupyter-widgets/controls",
416
+ "_view_module_version": "1.5.0",
417
+ "_view_name": "ProgressView",
418
+ "bar_style": "success",
419
+ "description": "",
420
+ "description_tooltip": null,
421
+ "layout": "IPY_MODEL_129676621768495d9b8f496870ec3861",
422
+ "max": 17492.0,
423
+ "min": 0.0,
424
+ "orientation": "horizontal",
425
+ "style": "IPY_MODEL_75e40a7c6b9e4941abeb7bd46bab91ed",
426
+ "value": 17492.0
427
+ }
428
+ },
429
+ "0804cfeca1a6489b930b877613bc6dcb": {
430
+ "model_module": "@jupyter-widgets/controls",
431
+ "model_module_version": "1.5.0",
432
+ "model_name": "DescriptionStyleModel",
433
+ "state": {
434
+ "_model_module": "@jupyter-widgets/controls",
435
+ "_model_module_version": "1.5.0",
436
+ "_model_name": "DescriptionStyleModel",
437
+ "_view_count": null,
438
+ "_view_module": "@jupyter-widgets/base",
439
+ "_view_module_version": "1.2.0",
440
+ "_view_name": "StyleView",
441
+ "description_width": ""
442
+ }
443
+ },
444
+ "089281cd484c4889b2cddd3ee55aad6e": {
445
+ "model_module": "@jupyter-widgets/controls",
446
+ "model_module_version": "1.5.0",
447
+ "model_name": "HTMLModel",
448
+ "state": {
449
+ "_dom_classes": [],
450
+ "_model_module": "@jupyter-widgets/controls",
451
+ "_model_module_version": "1.5.0",
452
+ "_model_name": "HTMLModel",
453
+ "_view_count": null,
454
+ "_view_module": "@jupyter-widgets/controls",
455
+ "_view_module_version": "1.5.0",
456
+ "_view_name": "HTMLView",
457
+ "description": "",
458
+ "description_tooltip": null,
459
+ "layout": "IPY_MODEL_8dde647640d14d77971154ec85674a6b",
460
+ "placeholder": "​",
461
+ "style": "IPY_MODEL_6bd547c8fa4745ff814c526e3c5f67ff",
462
+ "value": " 112/112 [00:00&lt;00:00, 7.18kB/s]"
463
+ }
464
+ },
465
+ "0c559307133043619b80d489c7970617": {
466
+ "model_module": "@jupyter-widgets/base",
467
+ "model_module_version": "1.2.0",
468
+ "model_name": "LayoutModel",
469
+ "state": {
470
+ "_model_module": "@jupyter-widgets/base",
471
+ "_model_module_version": "1.2.0",
472
+ "_model_name": "LayoutModel",
473
+ "_view_count": null,
474
+ "_view_module": "@jupyter-widgets/base",
475
+ "_view_module_version": "1.2.0",
476
+ "_view_name": "LayoutView",
477
+ "align_content": null,
478
+ "align_items": null,
479
+ "align_self": null,
480
+ "border": null,
481
+ "bottom": null,
482
+ "display": null,
483
+ "flex": null,
484
+ "flex_flow": null,
485
+ "grid_area": null,
486
+ "grid_auto_columns": null,
487
+ "grid_auto_flow": null,
488
+ "grid_auto_rows": null,
489
+ "grid_column": null,
490
+ "grid_gap": null,
491
+ "grid_row": null,
492
+ "grid_template_areas": null,
493
+ "grid_template_columns": null,
494
+ "grid_template_rows": null,
495
+ "height": null,
496
+ "justify_content": null,
497
+ "justify_items": null,
498
+ "left": null,
499
+ "margin": null,
500
+ "max_height": null,
501
+ "max_width": null,
502
+ "min_height": null,
503
+ "min_width": null,
504
+ "object_fit": null,
505
+ "object_position": null,
506
+ "order": null,
507
+ "overflow": null,
508
+ "overflow_x": null,
509
+ "overflow_y": null,
510
+ "padding": null,
511
+ "right": null,
512
+ "top": null,
513
+ "visibility": null,
514
+ "width": null
515
+ }
516
+ },
517
+ "1017fcfb8a8e4f05b7f170ea647f9153": {
518
+ "model_module": "@jupyter-widgets/controls",
519
+ "model_module_version": "1.5.0",
520
+ "model_name": "DescriptionStyleModel",
521
+ "state": {
522
+ "_model_module": "@jupyter-widgets/controls",
523
+ "_model_module_version": "1.5.0",
524
+ "_model_name": "DescriptionStyleModel",
525
+ "_view_count": null,
526
+ "_view_module": "@jupyter-widgets/base",
527
+ "_view_module_version": "1.2.0",
528
+ "_view_name": "StyleView",
529
+ "description_width": ""
530
+ }
531
+ },
532
+ "12095e20ae504e7d9fff53cd8baca6a8": {
533
+ "model_module": "@jupyter-widgets/controls",
534
+ "model_module_version": "1.5.0",
535
+ "model_name": "HTMLModel",
536
+ "state": {
537
+ "_dom_classes": [],
538
+ "_model_module": "@jupyter-widgets/controls",
539
+ "_model_module_version": "1.5.0",
540
+ "_model_name": "HTMLModel",
541
+ "_view_count": null,
542
+ "_view_module": "@jupyter-widgets/controls",
543
+ "_view_module_version": "1.5.0",
544
+ "_view_name": "HTMLView",
545
+ "description": "",
546
+ "description_tooltip": null,
547
+ "layout": "IPY_MODEL_728389ff6763493a8c0f0bb1de66fadc",
548
+ "placeholder": "​",
549
+ "style": "IPY_MODEL_dee5ee6686494be8b7be41e01576cd77",
550
+ "value": "Downloading (…)cial_tokens_map.json: 100%"
551
+ }
552
+ },
553
+ "1246cc73517b40b9825c90feb26d9f52": {
554
+ "model_module": "@jupyter-widgets/controls",
555
+ "model_module_version": "1.5.0",
556
+ "model_name": "HBoxModel",
557
+ "state": {
558
+ "_dom_classes": [],
559
+ "_model_module": "@jupyter-widgets/controls",
560
+ "_model_module_version": "1.5.0",
561
+ "_model_name": "HBoxModel",
562
+ "_view_count": null,
563
+ "_view_module": "@jupyter-widgets/controls",
564
+ "_view_module_version": "1.5.0",
565
+ "_view_name": "HBoxView",
566
+ "box_style": "",
567
+ "children": [
568
+ "IPY_MODEL_73eec9d7aad24824ab878ec617b9f4a8",
569
+ "IPY_MODEL_fe2339e92ef34a669751ef54d20b09fd",
570
+ "IPY_MODEL_ec9c1d9e2d7e4c38955ed3455ea216f6"
571
+ ],
572
+ "layout": "IPY_MODEL_b5ee209943d746a9a47ce936a9d10475"
573
+ }
574
+ },
575
+ "129676621768495d9b8f496870ec3861": {
576
+ "model_module": "@jupyter-widgets/base",
577
+ "model_module_version": "1.2.0",
578
+ "model_name": "LayoutModel",
579
+ "state": {
580
+ "_model_module": "@jupyter-widgets/base",
581
+ "_model_module_version": "1.2.0",
582
+ "_model_name": "LayoutModel",
583
+ "_view_count": null,
584
+ "_view_module": "@jupyter-widgets/base",
585
+ "_view_module_version": "1.2.0",
586
+ "_view_name": "LayoutView",
587
+ "align_content": null,
588
+ "align_items": null,
589
+ "align_self": null,
590
+ "border": null,
591
+ "bottom": null,
592
+ "display": null,
593
+ "flex": null,
594
+ "flex_flow": null,
595
+ "grid_area": null,
596
+ "grid_auto_columns": null,
597
+ "grid_auto_flow": null,
598
+ "grid_auto_rows": null,
599
+ "grid_column": null,
600
+ "grid_gap": null,
601
+ "grid_row": null,
602
+ "grid_template_areas": null,
603
+ "grid_template_columns": null,
604
+ "grid_template_rows": null,
605
+ "height": null,
606
+ "justify_content": null,
607
+ "justify_items": null,
608
+ "left": null,
609
+ "margin": null,
610
+ "max_height": null,
611
+ "max_width": null,
612
+ "min_height": null,
613
+ "min_width": null,
614
+ "object_fit": null,
615
+ "object_position": null,
616
+ "order": null,
617
+ "overflow": null,
618
+ "overflow_x": null,
619
+ "overflow_y": null,
620
+ "padding": null,
621
+ "right": null,
622
+ "top": null,
623
+ "visibility": null,
624
+ "width": null
625
+ }
626
+ },
627
+ "14127d5e851e4e77a15525d27f2ab349": {
628
+ "model_module": "@jupyter-widgets/controls",
629
+ "model_module_version": "1.5.0",
630
+ "model_name": "HBoxModel",
631
+ "state": {
632
+ "_dom_classes": [],
633
+ "_model_module": "@jupyter-widgets/controls",
634
+ "_model_module_version": "1.5.0",
635
+ "_model_name": "HBoxModel",
636
+ "_view_count": null,
637
+ "_view_module": "@jupyter-widgets/controls",
638
+ "_view_module_version": "1.5.0",
639
+ "_view_name": "HBoxView",
640
+ "box_style": "",
641
+ "children": [
642
+ "IPY_MODEL_76c21e9959a746ff844d3c3cee8f4dba",
643
+ "IPY_MODEL_0703099941d34ae3a9477b7d8e741cc5",
644
+ "IPY_MODEL_9ddd368390d949c6b4fb40463871ba01"
645
+ ],
646
+ "layout": "IPY_MODEL_bda35a315662410fb7b68d63b56c5cfc"
647
+ }
648
+ },
649
+ "151ab56449e8416cb04ce3d0be5d8899": {
650
+ "model_module": "@jupyter-widgets/controls",
651
+ "model_module_version": "1.5.0",
652
+ "model_name": "HTMLModel",
653
+ "state": {
654
+ "_dom_classes": [],
655
+ "_model_module": "@jupyter-widgets/controls",
656
+ "_model_module_version": "1.5.0",
657
+ "_model_name": "HTMLModel",
658
+ "_view_count": null,
659
+ "_view_module": "@jupyter-widgets/controls",
660
+ "_view_module_version": "1.5.0",
661
+ "_view_name": "HTMLView",
662
+ "description": "",
663
+ "description_tooltip": null,
664
+ "layout": "IPY_MODEL_5867a9979abc4440a64d1894199a2704",
665
+ "placeholder": "​",
666
+ "style": "IPY_MODEL_bee95ee151074c8f99728c877d60b16e",
667
+ "value": " 232k/232k [00:00&lt;00:00, 5.37MB/s]"
668
+ }
669
+ },
670
+ "2004f819be47491a933ea34bd72cfcc1": {
671
+ "model_module": "@jupyter-widgets/controls",
672
+ "model_module_version": "1.5.0",
673
+ "model_name": "HTMLModel",
674
+ "state": {
675
+ "_dom_classes": [],
676
+ "_model_module": "@jupyter-widgets/controls",
677
+ "_model_module_version": "1.5.0",
678
+ "_model_name": "HTMLModel",
679
+ "_view_count": null,
680
+ "_view_module": "@jupyter-widgets/controls",
681
+ "_view_module_version": "1.5.0",
682
+ "_view_name": "HTMLView",
683
+ "description": "",
684
+ "description_tooltip": null,
685
+ "layout": "IPY_MODEL_8bd5b0abca4e4b1ab2a4dc575319b6a9",
686
+ "placeholder": "​",
687
+ "style": "IPY_MODEL_739bafcd739241aaa5f2992176c85e58",
688
+ "value": "Downloading (…)okenizer_config.json: 100%"
689
+ }
690
+ },
691
+ "20cac87ded1444e4818e0448ab7748c2": {
692
+ "model_module": "@jupyter-widgets/base",
693
+ "model_module_version": "1.2.0",
694
+ "model_name": "LayoutModel",
695
+ "state": {
696
+ "_model_module": "@jupyter-widgets/base",
697
+ "_model_module_version": "1.2.0",
698
+ "_model_name": "LayoutModel",
699
+ "_view_count": null,
700
+ "_view_module": "@jupyter-widgets/base",
701
+ "_view_module_version": "1.2.0",
702
+ "_view_name": "LayoutView",
703
+ "align_content": null,
704
+ "align_items": null,
705
+ "align_self": null,
706
+ "border": null,
707
+ "bottom": null,
708
+ "display": null,
709
+ "flex": null,
710
+ "flex_flow": null,
711
+ "grid_area": null,
712
+ "grid_auto_columns": null,
713
+ "grid_auto_flow": null,
714
+ "grid_auto_rows": null,
715
+ "grid_column": null,
716
+ "grid_gap": null,
717
+ "grid_row": null,
718
+ "grid_template_areas": null,
719
+ "grid_template_columns": null,
720
+ "grid_template_rows": null,
721
+ "height": null,
722
+ "justify_content": null,
723
+ "justify_items": null,
724
+ "left": null,
725
+ "margin": null,
726
+ "max_height": null,
727
+ "max_width": null,
728
+ "min_height": null,
729
+ "min_width": null,
730
+ "object_fit": null,
731
+ "object_position": null,
732
+ "order": null,
733
+ "overflow": null,
734
+ "overflow_x": null,
735
+ "overflow_y": null,
736
+ "padding": null,
737
+ "right": null,
738
+ "top": null,
739
+ "visibility": null,
740
+ "width": null
741
+ }
742
+ },
743
+ "24bf29b8f9384543ba43093895045582": {
744
+ "model_module": "@jupyter-widgets/base",
745
+ "model_module_version": "1.2.0",
746
+ "model_name": "LayoutModel",
747
+ "state": {
748
+ "_model_module": "@jupyter-widgets/base",
749
+ "_model_module_version": "1.2.0",
750
+ "_model_name": "LayoutModel",
751
+ "_view_count": null,
752
+ "_view_module": "@jupyter-widgets/base",
753
+ "_view_module_version": "1.2.0",
754
+ "_view_name": "LayoutView",
755
+ "align_content": null,
756
+ "align_items": null,
757
+ "align_self": null,
758
+ "border": null,
759
+ "bottom": null,
760
+ "display": null,
761
+ "flex": null,
762
+ "flex_flow": null,
763
+ "grid_area": null,
764
+ "grid_auto_columns": null,
765
+ "grid_auto_flow": null,
766
+ "grid_auto_rows": null,
767
+ "grid_column": null,
768
+ "grid_gap": null,
769
+ "grid_row": null,
770
+ "grid_template_areas": null,
771
+ "grid_template_columns": null,
772
+ "grid_template_rows": null,
773
+ "height": null,
774
+ "justify_content": null,
775
+ "justify_items": null,
776
+ "left": null,
777
+ "margin": null,
778
+ "max_height": null,
779
+ "max_width": null,
780
+ "min_height": null,
781
+ "min_width": null,
782
+ "object_fit": null,
783
+ "object_position": null,
784
+ "order": null,
785
+ "overflow": null,
786
+ "overflow_x": null,
787
+ "overflow_y": null,
788
+ "padding": null,
789
+ "right": null,
790
+ "top": null,
791
+ "visibility": null,
792
+ "width": null
793
+ }
794
+ },
795
+ "2842c25aef774a7b9eab85c90f18b933": {
796
+ "model_module": "@jupyter-widgets/base",
797
+ "model_module_version": "1.2.0",
798
+ "model_name": "LayoutModel",
799
+ "state": {
800
+ "_model_module": "@jupyter-widgets/base",
801
+ "_model_module_version": "1.2.0",
802
+ "_model_name": "LayoutModel",
803
+ "_view_count": null,
804
+ "_view_module": "@jupyter-widgets/base",
805
+ "_view_module_version": "1.2.0",
806
+ "_view_name": "LayoutView",
807
+ "align_content": null,
808
+ "align_items": null,
809
+ "align_self": null,
810
+ "border": null,
811
+ "bottom": null,
812
+ "display": null,
813
+ "flex": null,
814
+ "flex_flow": null,
815
+ "grid_area": null,
816
+ "grid_auto_columns": null,
817
+ "grid_auto_flow": null,
818
+ "grid_auto_rows": null,
819
+ "grid_column": null,
820
+ "grid_gap": null,
821
+ "grid_row": null,
822
+ "grid_template_areas": null,
823
+ "grid_template_columns": null,
824
+ "grid_template_rows": null,
825
+ "height": null,
826
+ "justify_content": null,
827
+ "justify_items": null,
828
+ "left": null,
829
+ "margin": null,
830
+ "max_height": null,
831
+ "max_width": null,
832
+ "min_height": null,
833
+ "min_width": null,
834
+ "object_fit": null,
835
+ "object_position": null,
836
+ "order": null,
837
+ "overflow": null,
838
+ "overflow_x": null,
839
+ "overflow_y": null,
840
+ "padding": null,
841
+ "right": null,
842
+ "top": null,
843
+ "visibility": null,
844
+ "width": null
845
+ }
846
+ },
847
+ "299f0b46936f450092d10b436f6b43a3": {
848
+ "model_module": "@jupyter-widgets/controls",
849
+ "model_module_version": "1.5.0",
850
+ "model_name": "ProgressStyleModel",
851
+ "state": {
852
+ "_model_module": "@jupyter-widgets/controls",
853
+ "_model_module_version": "1.5.0",
854
+ "_model_name": "ProgressStyleModel",
855
+ "_view_count": null,
856
+ "_view_module": "@jupyter-widgets/base",
857
+ "_view_module_version": "1.2.0",
858
+ "_view_name": "StyleView",
859
+ "bar_color": null,
860
+ "description_width": ""
861
+ }
862
+ },
863
+ "2b1a638fb2794b69b0f73e87ea6d072d": {
864
+ "model_module": "@jupyter-widgets/base",
865
+ "model_module_version": "1.2.0",
866
+ "model_name": "LayoutModel",
867
+ "state": {
868
+ "_model_module": "@jupyter-widgets/base",
869
+ "_model_module_version": "1.2.0",
870
+ "_model_name": "LayoutModel",
871
+ "_view_count": null,
872
+ "_view_module": "@jupyter-widgets/base",
873
+ "_view_module_version": "1.2.0",
874
+ "_view_name": "LayoutView",
875
+ "align_content": null,
876
+ "align_items": null,
877
+ "align_self": null,
878
+ "border": null,
879
+ "bottom": null,
880
+ "display": null,
881
+ "flex": null,
882
+ "flex_flow": null,
883
+ "grid_area": null,
884
+ "grid_auto_columns": null,
885
+ "grid_auto_flow": null,
886
+ "grid_auto_rows": null,
887
+ "grid_column": null,
888
+ "grid_gap": null,
889
+ "grid_row": null,
890
+ "grid_template_areas": null,
891
+ "grid_template_columns": null,
892
+ "grid_template_rows": null,
893
+ "height": null,
894
+ "justify_content": null,
895
+ "justify_items": null,
896
+ "left": null,
897
+ "margin": null,
898
+ "max_height": null,
899
+ "max_width": null,
900
+ "min_height": null,
901
+ "min_width": null,
902
+ "object_fit": null,
903
+ "object_position": null,
904
+ "order": null,
905
+ "overflow": null,
906
+ "overflow_x": null,
907
+ "overflow_y": null,
908
+ "padding": null,
909
+ "right": null,
910
+ "top": null,
911
+ "visibility": null,
912
+ "width": null
913
+ }
914
+ },
915
+ "31e628d2e8c740b2be7fca4705d1374c": {
916
+ "model_module": "@jupyter-widgets/controls",
917
+ "model_module_version": "1.5.0",
918
+ "model_name": "DescriptionStyleModel",
919
+ "state": {
920
+ "_model_module": "@jupyter-widgets/controls",
921
+ "_model_module_version": "1.5.0",
922
+ "_model_name": "DescriptionStyleModel",
923
+ "_view_count": null,
924
+ "_view_module": "@jupyter-widgets/base",
925
+ "_view_module_version": "1.2.0",
926
+ "_view_name": "StyleView",
927
+ "description_width": ""
928
+ }
929
+ },
930
+ "38e5a6017a5f43d088c9d62d46069ff6": {
931
+ "model_module": "@jupyter-widgets/base",
932
+ "model_module_version": "1.2.0",
933
+ "model_name": "LayoutModel",
934
+ "state": {
935
+ "_model_module": "@jupyter-widgets/base",
936
+ "_model_module_version": "1.2.0",
937
+ "_model_name": "LayoutModel",
938
+ "_view_count": null,
939
+ "_view_module": "@jupyter-widgets/base",
940
+ "_view_module_version": "1.2.0",
941
+ "_view_name": "LayoutView",
942
+ "align_content": null,
943
+ "align_items": null,
944
+ "align_self": null,
945
+ "border": null,
946
+ "bottom": null,
947
+ "display": null,
948
+ "flex": null,
949
+ "flex_flow": null,
950
+ "grid_area": null,
951
+ "grid_auto_columns": null,
952
+ "grid_auto_flow": null,
953
+ "grid_auto_rows": null,
954
+ "grid_column": null,
955
+ "grid_gap": null,
956
+ "grid_row": null,
957
+ "grid_template_areas": null,
958
+ "grid_template_columns": null,
959
+ "grid_template_rows": null,
960
+ "height": null,
961
+ "justify_content": null,
962
+ "justify_items": null,
963
+ "left": null,
964
+ "margin": null,
965
+ "max_height": null,
966
+ "max_width": null,
967
+ "min_height": null,
968
+ "min_width": null,
969
+ "object_fit": null,
970
+ "object_position": null,
971
+ "order": null,
972
+ "overflow": null,
973
+ "overflow_x": null,
974
+ "overflow_y": null,
975
+ "padding": null,
976
+ "right": null,
977
+ "top": null,
978
+ "visibility": null,
979
+ "width": null
980
+ }
981
+ },
982
+ "3cf3d82361884b55b2bd03ac4ec57d55": {
983
+ "model_module": "@jupyter-widgets/controls",
984
+ "model_module_version": "1.5.0",
985
+ "model_name": "ProgressStyleModel",
986
+ "state": {
987
+ "_model_module": "@jupyter-widgets/controls",
988
+ "_model_module_version": "1.5.0",
989
+ "_model_name": "ProgressStyleModel",
990
+ "_view_count": null,
991
+ "_view_module": "@jupyter-widgets/base",
992
+ "_view_module_version": "1.2.0",
993
+ "_view_name": "StyleView",
994
+ "bar_color": null,
995
+ "description_width": ""
996
+ }
997
+ },
998
+ "3e836d356ce74139944aa886508ac3a7": {
999
+ "model_module": "@jupyter-widgets/controls",
1000
+ "model_module_version": "1.5.0",
1001
+ "model_name": "ProgressStyleModel",
1002
+ "state": {
1003
+ "_model_module": "@jupyter-widgets/controls",
1004
+ "_model_module_version": "1.5.0",
1005
+ "_model_name": "ProgressStyleModel",
1006
+ "_view_count": null,
1007
+ "_view_module": "@jupyter-widgets/base",
1008
+ "_view_module_version": "1.2.0",
1009
+ "_view_name": "StyleView",
1010
+ "bar_color": null,
1011
+ "description_width": ""
1012
+ }
1013
+ },
1014
+ "43053627932b4edea85fdeeb34d7a53c": {
1015
+ "model_module": "@jupyter-widgets/base",
1016
+ "model_module_version": "1.2.0",
1017
+ "model_name": "LayoutModel",
1018
+ "state": {
1019
+ "_model_module": "@jupyter-widgets/base",
1020
+ "_model_module_version": "1.2.0",
1021
+ "_model_name": "LayoutModel",
1022
+ "_view_count": null,
1023
+ "_view_module": "@jupyter-widgets/base",
1024
+ "_view_module_version": "1.2.0",
1025
+ "_view_name": "LayoutView",
1026
+ "align_content": null,
1027
+ "align_items": null,
1028
+ "align_self": null,
1029
+ "border": null,
1030
+ "bottom": null,
1031
+ "display": null,
1032
+ "flex": null,
1033
+ "flex_flow": null,
1034
+ "grid_area": null,
1035
+ "grid_auto_columns": null,
1036
+ "grid_auto_flow": null,
1037
+ "grid_auto_rows": null,
1038
+ "grid_column": null,
1039
+ "grid_gap": null,
1040
+ "grid_row": null,
1041
+ "grid_template_areas": null,
1042
+ "grid_template_columns": null,
1043
+ "grid_template_rows": null,
1044
+ "height": null,
1045
+ "justify_content": null,
1046
+ "justify_items": null,
1047
+ "left": null,
1048
+ "margin": null,
1049
+ "max_height": null,
1050
+ "max_width": null,
1051
+ "min_height": null,
1052
+ "min_width": null,
1053
+ "object_fit": null,
1054
+ "object_position": null,
1055
+ "order": null,
1056
+ "overflow": null,
1057
+ "overflow_x": null,
1058
+ "overflow_y": null,
1059
+ "padding": null,
1060
+ "right": null,
1061
+ "top": null,
1062
+ "visibility": null,
1063
+ "width": null
1064
+ }
1065
+ },
1066
+ "47ee5f2d6b7644d8a351c0804ed3a85e": {
1067
+ "model_module": "@jupyter-widgets/base",
1068
+ "model_module_version": "1.2.0",
1069
+ "model_name": "LayoutModel",
1070
+ "state": {
1071
+ "_model_module": "@jupyter-widgets/base",
1072
+ "_model_module_version": "1.2.0",
1073
+ "_model_name": "LayoutModel",
1074
+ "_view_count": null,
1075
+ "_view_module": "@jupyter-widgets/base",
1076
+ "_view_module_version": "1.2.0",
1077
+ "_view_name": "LayoutView",
1078
+ "align_content": null,
1079
+ "align_items": null,
1080
+ "align_self": null,
1081
+ "border": null,
1082
+ "bottom": null,
1083
+ "display": null,
1084
+ "flex": null,
1085
+ "flex_flow": null,
1086
+ "grid_area": null,
1087
+ "grid_auto_columns": null,
1088
+ "grid_auto_flow": null,
1089
+ "grid_auto_rows": null,
1090
+ "grid_column": null,
1091
+ "grid_gap": null,
1092
+ "grid_row": null,
1093
+ "grid_template_areas": null,
1094
+ "grid_template_columns": null,
1095
+ "grid_template_rows": null,
1096
+ "height": null,
1097
+ "justify_content": null,
1098
+ "justify_items": null,
1099
+ "left": null,
1100
+ "margin": null,
1101
+ "max_height": null,
1102
+ "max_width": null,
1103
+ "min_height": null,
1104
+ "min_width": null,
1105
+ "object_fit": null,
1106
+ "object_position": null,
1107
+ "order": null,
1108
+ "overflow": null,
1109
+ "overflow_x": null,
1110
+ "overflow_y": null,
1111
+ "padding": null,
1112
+ "right": null,
1113
+ "top": null,
1114
+ "visibility": null,
1115
+ "width": null
1116
+ }
1117
+ },
1118
+ "4888b08f9cc54d1f8a7199e4f0139aeb": {
1119
+ "model_module": "@jupyter-widgets/controls",
1120
+ "model_module_version": "1.5.0",
1121
+ "model_name": "HTMLModel",
1122
+ "state": {
1123
+ "_dom_classes": [],
1124
+ "_model_module": "@jupyter-widgets/controls",
1125
+ "_model_module_version": "1.5.0",
1126
+ "_model_name": "HTMLModel",
1127
+ "_view_count": null,
1128
+ "_view_module": "@jupyter-widgets/controls",
1129
+ "_view_module_version": "1.5.0",
1130
+ "_view_name": "HTMLView",
1131
+ "description": "",
1132
+ "description_tooltip": null,
1133
+ "layout": "IPY_MODEL_47ee5f2d6b7644d8a351c0804ed3a85e",
1134
+ "placeholder": "​",
1135
+ "style": "IPY_MODEL_738be44b9d8245bfacbb2b515217fe2f",
1136
+ "value": "Downloading (…)/main/tokenizer.json: 100%"
1137
+ }
1138
+ },
1139
+ "5867a9979abc4440a64d1894199a2704": {
1140
+ "model_module": "@jupyter-widgets/base",
1141
+ "model_module_version": "1.2.0",
1142
+ "model_name": "LayoutModel",
1143
+ "state": {
1144
+ "_model_module": "@jupyter-widgets/base",
1145
+ "_model_module_version": "1.2.0",
1146
+ "_model_name": "LayoutModel",
1147
+ "_view_count": null,
1148
+ "_view_module": "@jupyter-widgets/base",
1149
+ "_view_module_version": "1.2.0",
1150
+ "_view_name": "LayoutView",
1151
+ "align_content": null,
1152
+ "align_items": null,
1153
+ "align_self": null,
1154
+ "border": null,
1155
+ "bottom": null,
1156
+ "display": null,
1157
+ "flex": null,
1158
+ "flex_flow": null,
1159
+ "grid_area": null,
1160
+ "grid_auto_columns": null,
1161
+ "grid_auto_flow": null,
1162
+ "grid_auto_rows": null,
1163
+ "grid_column": null,
1164
+ "grid_gap": null,
1165
+ "grid_row": null,
1166
+ "grid_template_areas": null,
1167
+ "grid_template_columns": null,
1168
+ "grid_template_rows": null,
1169
+ "height": null,
1170
+ "justify_content": null,
1171
+ "justify_items": null,
1172
+ "left": null,
1173
+ "margin": null,
1174
+ "max_height": null,
1175
+ "max_width": null,
1176
+ "min_height": null,
1177
+ "min_width": null,
1178
+ "object_fit": null,
1179
+ "object_position": null,
1180
+ "order": null,
1181
+ "overflow": null,
1182
+ "overflow_x": null,
1183
+ "overflow_y": null,
1184
+ "padding": null,
1185
+ "right": null,
1186
+ "top": null,
1187
+ "visibility": null,
1188
+ "width": null
1189
+ }
1190
+ },
1191
+ "5c5c72fdad194864a1b71ed5637a7efc": {
1192
+ "model_module": "@jupyter-widgets/controls",
1193
+ "model_module_version": "1.5.0",
1194
+ "model_name": "FloatProgressModel",
1195
+ "state": {
1196
+ "_dom_classes": [],
1197
+ "_model_module": "@jupyter-widgets/controls",
1198
+ "_model_module_version": "1.5.0",
1199
+ "_model_name": "FloatProgressModel",
1200
+ "_view_count": null,
1201
+ "_view_module": "@jupyter-widgets/controls",
1202
+ "_view_module_version": "1.5.0",
1203
+ "_view_name": "ProgressView",
1204
+ "bar_style": "success",
1205
+ "description": "",
1206
+ "description_tooltip": null,
1207
+ "layout": "IPY_MODEL_b041fdd5345b4cb1bf0b4ddd1aa4f40c",
1208
+ "max": 466247.0,
1209
+ "min": 0.0,
1210
+ "orientation": "horizontal",
1211
+ "style": "IPY_MODEL_acc9a4eede7647a49445b89c9ea92cea",
1212
+ "value": 466247.0
1213
+ }
1214
+ },
1215
+ "5cc6716d300e446399e65ac8dd72dccf": {
1216
+ "model_module": "@jupyter-widgets/base",
1217
+ "model_module_version": "1.2.0",
1218
+ "model_name": "LayoutModel",
1219
+ "state": {
1220
+ "_model_module": "@jupyter-widgets/base",
1221
+ "_model_module_version": "1.2.0",
1222
+ "_model_name": "LayoutModel",
1223
+ "_view_count": null,
1224
+ "_view_module": "@jupyter-widgets/base",
1225
+ "_view_module_version": "1.2.0",
1226
+ "_view_name": "LayoutView",
1227
+ "align_content": null,
1228
+ "align_items": null,
1229
+ "align_self": null,
1230
+ "border": null,
1231
+ "bottom": null,
1232
+ "display": null,
1233
+ "flex": null,
1234
+ "flex_flow": null,
1235
+ "grid_area": null,
1236
+ "grid_auto_columns": null,
1237
+ "grid_auto_flow": null,
1238
+ "grid_auto_rows": null,
1239
+ "grid_column": null,
1240
+ "grid_gap": null,
1241
+ "grid_row": null,
1242
+ "grid_template_areas": null,
1243
+ "grid_template_columns": null,
1244
+ "grid_template_rows": null,
1245
+ "height": null,
1246
+ "justify_content": null,
1247
+ "justify_items": null,
1248
+ "left": null,
1249
+ "margin": null,
1250
+ "max_height": null,
1251
+ "max_width": null,
1252
+ "min_height": null,
1253
+ "min_width": null,
1254
+ "object_fit": null,
1255
+ "object_position": null,
1256
+ "order": null,
1257
+ "overflow": null,
1258
+ "overflow_x": null,
1259
+ "overflow_y": null,
1260
+ "padding": null,
1261
+ "right": null,
1262
+ "top": null,
1263
+ "visibility": null,
1264
+ "width": null
1265
+ }
1266
+ },
1267
+ "67baaac3028142e8b813c46f7dfe5a36": {
1268
+ "model_module": "@jupyter-widgets/controls",
1269
+ "model_module_version": "1.5.0",
1270
+ "model_name": "DescriptionStyleModel",
1271
+ "state": {
1272
+ "_model_module": "@jupyter-widgets/controls",
1273
+ "_model_module_version": "1.5.0",
1274
+ "_model_name": "DescriptionStyleModel",
1275
+ "_view_count": null,
1276
+ "_view_module": "@jupyter-widgets/base",
1277
+ "_view_module_version": "1.2.0",
1278
+ "_view_name": "StyleView",
1279
+ "description_width": ""
1280
+ }
1281
+ },
1282
+ "6a4ad7e517e347d282b9e2674624b7e7": {
1283
+ "model_module": "@jupyter-widgets/controls",
1284
+ "model_module_version": "1.5.0",
1285
+ "model_name": "HTMLModel",
1286
+ "state": {
1287
+ "_dom_classes": [],
1288
+ "_model_module": "@jupyter-widgets/controls",
1289
+ "_model_module_version": "1.5.0",
1290
+ "_model_name": "HTMLModel",
1291
+ "_view_count": null,
1292
+ "_view_module": "@jupyter-widgets/controls",
1293
+ "_view_module_version": "1.5.0",
1294
+ "_view_name": "HTMLView",
1295
+ "description": "",
1296
+ "description_tooltip": null,
1297
+ "layout": "IPY_MODEL_015ee89d5e874c818cdaff8a2f05c22d",
1298
+ "placeholder": "​",
1299
+ "style": "IPY_MODEL_1017fcfb8a8e4f05b7f170ea647f9153",
1300
+ "value": " 612/612 [00:00&lt;00:00, 26.7kB/s]"
1301
+ }
1302
+ },
1303
+ "6bd547c8fa4745ff814c526e3c5f67ff": {
1304
+ "model_module": "@jupyter-widgets/controls",
1305
+ "model_module_version": "1.5.0",
1306
+ "model_name": "DescriptionStyleModel",
1307
+ "state": {
1308
+ "_model_module": "@jupyter-widgets/controls",
1309
+ "_model_module_version": "1.5.0",
1310
+ "_model_name": "DescriptionStyleModel",
1311
+ "_view_count": null,
1312
+ "_view_module": "@jupyter-widgets/base",
1313
+ "_view_module_version": "1.2.0",
1314
+ "_view_name": "StyleView",
1315
+ "description_width": ""
1316
+ }
1317
+ },
1318
+ "703ed0de51694202b67cc2d006f10c5a": {
1319
+ "model_module": "@jupyter-widgets/controls",
1320
+ "model_module_version": "1.5.0",
1321
+ "model_name": "HTMLModel",
1322
+ "state": {
1323
+ "_dom_classes": [],
1324
+ "_model_module": "@jupyter-widgets/controls",
1325
+ "_model_module_version": "1.5.0",
1326
+ "_model_name": "HTMLModel",
1327
+ "_view_count": null,
1328
+ "_view_module": "@jupyter-widgets/controls",
1329
+ "_view_module_version": "1.5.0",
1330
+ "_view_name": "HTMLView",
1331
+ "description": "",
1332
+ "description_tooltip": null,
1333
+ "layout": "IPY_MODEL_43053627932b4edea85fdeeb34d7a53c",
1334
+ "placeholder": "​",
1335
+ "style": "IPY_MODEL_d9f09e15efdf4809af048238299005ef",
1336
+ "value": " 350/350 [00:00&lt;00:00, 14.4kB/s]"
1337
+ }
1338
+ },
1339
+ "728389ff6763493a8c0f0bb1de66fadc": {
1340
+ "model_module": "@jupyter-widgets/base",
1341
+ "model_module_version": "1.2.0",
1342
+ "model_name": "LayoutModel",
1343
+ "state": {
1344
+ "_model_module": "@jupyter-widgets/base",
1345
+ "_model_module_version": "1.2.0",
1346
+ "_model_name": "LayoutModel",
1347
+ "_view_count": null,
1348
+ "_view_module": "@jupyter-widgets/base",
1349
+ "_view_module_version": "1.2.0",
1350
+ "_view_name": "LayoutView",
1351
+ "align_content": null,
1352
+ "align_items": null,
1353
+ "align_self": null,
1354
+ "border": null,
1355
+ "bottom": null,
1356
+ "display": null,
1357
+ "flex": null,
1358
+ "flex_flow": null,
1359
+ "grid_area": null,
1360
+ "grid_auto_columns": null,
1361
+ "grid_auto_flow": null,
1362
+ "grid_auto_rows": null,
1363
+ "grid_column": null,
1364
+ "grid_gap": null,
1365
+ "grid_row": null,
1366
+ "grid_template_areas": null,
1367
+ "grid_template_columns": null,
1368
+ "grid_template_rows": null,
1369
+ "height": null,
1370
+ "justify_content": null,
1371
+ "justify_items": null,
1372
+ "left": null,
1373
+ "margin": null,
1374
+ "max_height": null,
1375
+ "max_width": null,
1376
+ "min_height": null,
1377
+ "min_width": null,
1378
+ "object_fit": null,
1379
+ "object_position": null,
1380
+ "order": null,
1381
+ "overflow": null,
1382
+ "overflow_x": null,
1383
+ "overflow_y": null,
1384
+ "padding": null,
1385
+ "right": null,
1386
+ "top": null,
1387
+ "visibility": null,
1388
+ "width": null
1389
+ }
1390
+ },
1391
+ "738be44b9d8245bfacbb2b515217fe2f": {
1392
+ "model_module": "@jupyter-widgets/controls",
1393
+ "model_module_version": "1.5.0",
1394
+ "model_name": "DescriptionStyleModel",
1395
+ "state": {
1396
+ "_model_module": "@jupyter-widgets/controls",
1397
+ "_model_module_version": "1.5.0",
1398
+ "_model_name": "DescriptionStyleModel",
1399
+ "_view_count": null,
1400
+ "_view_module": "@jupyter-widgets/base",
1401
+ "_view_module_version": "1.2.0",
1402
+ "_view_name": "StyleView",
1403
+ "description_width": ""
1404
+ }
1405
+ },
1406
+ "739bafcd739241aaa5f2992176c85e58": {
1407
+ "model_module": "@jupyter-widgets/controls",
1408
+ "model_module_version": "1.5.0",
1409
+ "model_name": "DescriptionStyleModel",
1410
+ "state": {
1411
+ "_model_module": "@jupyter-widgets/controls",
1412
+ "_model_module_version": "1.5.0",
1413
+ "_model_name": "DescriptionStyleModel",
1414
+ "_view_count": null,
1415
+ "_view_module": "@jupyter-widgets/base",
1416
+ "_view_module_version": "1.2.0",
1417
+ "_view_name": "StyleView",
1418
+ "description_width": ""
1419
+ }
1420
+ },
1421
+ "73eec9d7aad24824ab878ec617b9f4a8": {
1422
+ "model_module": "@jupyter-widgets/controls",
1423
+ "model_module_version": "1.5.0",
1424
+ "model_name": "HTMLModel",
1425
+ "state": {
1426
+ "_dom_classes": [],
1427
+ "_model_module": "@jupyter-widgets/controls",
1428
+ "_model_module_version": "1.5.0",
1429
+ "_model_name": "HTMLModel",
1430
+ "_view_count": null,
1431
+ "_view_module": "@jupyter-widgets/controls",
1432
+ "_view_module_version": "1.5.0",
1433
+ "_view_name": "HTMLView",
1434
+ "description": "",
1435
+ "description_tooltip": null,
1436
+ "layout": "IPY_MODEL_b8f7681ae1974b21bc73a86d9bd0dc13",
1437
+ "placeholder": "​",
1438
+ "style": "IPY_MODEL_0804cfeca1a6489b930b877613bc6dcb",
1439
+ "value": "Downloading pytorch_model.bin: 100%"
1440
+ }
1441
+ },
1442
+ "75e40a7c6b9e4941abeb7bd46bab91ed": {
1443
+ "model_module": "@jupyter-widgets/controls",
1444
+ "model_module_version": "1.5.0",
1445
+ "model_name": "ProgressStyleModel",
1446
+ "state": {
1447
+ "_model_module": "@jupyter-widgets/controls",
1448
+ "_model_module_version": "1.5.0",
1449
+ "_model_name": "ProgressStyleModel",
1450
+ "_view_count": null,
1451
+ "_view_module": "@jupyter-widgets/base",
1452
+ "_view_module_version": "1.2.0",
1453
+ "_view_name": "StyleView",
1454
+ "bar_color": null,
1455
+ "description_width": ""
1456
+ }
1457
+ },
1458
+ "76c21e9959a746ff844d3c3cee8f4dba": {
1459
+ "model_module": "@jupyter-widgets/controls",
1460
+ "model_module_version": "1.5.0",
1461
+ "model_name": "HTMLModel",
1462
+ "state": {
1463
+ "_dom_classes": [],
1464
+ "_model_module": "@jupyter-widgets/controls",
1465
+ "_model_module_version": "1.5.0",
1466
+ "_model_name": "HTMLModel",
1467
+ "_view_count": null,
1468
+ "_view_module": "@jupyter-widgets/controls",
1469
+ "_view_module_version": "1.5.0",
1470
+ "_view_name": "HTMLView",
1471
+ "description": "",
1472
+ "description_tooltip": null,
1473
+ "layout": "IPY_MODEL_04a4e4d8e06c4dc8a0220e79c81f48e3",
1474
+ "placeholder": "​",
1475
+ "style": "IPY_MODEL_31e628d2e8c740b2be7fca4705d1374c",
1476
+ "value": "100%"
1477
+ }
1478
+ },
1479
+ "7876aff2f3d24a53af0c20e4d6ba1c94": {
1480
+ "model_module": "@jupyter-widgets/controls",
1481
+ "model_module_version": "1.5.0",
1482
+ "model_name": "HBoxModel",
1483
+ "state": {
1484
+ "_dom_classes": [],
1485
+ "_model_module": "@jupyter-widgets/controls",
1486
+ "_model_module_version": "1.5.0",
1487
+ "_model_name": "HBoxModel",
1488
+ "_view_count": null,
1489
+ "_view_module": "@jupyter-widgets/controls",
1490
+ "_view_module_version": "1.5.0",
1491
+ "_view_name": "HBoxView",
1492
+ "box_style": "",
1493
+ "children": [
1494
+ "IPY_MODEL_12095e20ae504e7d9fff53cd8baca6a8",
1495
+ "IPY_MODEL_cf46572053f6463fb4ebd4fcaf0121e3",
1496
+ "IPY_MODEL_089281cd484c4889b2cddd3ee55aad6e"
1497
+ ],
1498
+ "layout": "IPY_MODEL_b63dc39182534430aa662a90cb731664"
1499
+ }
1500
+ },
1501
+ "7bbe332d901749c1ab35e01ead65b105": {
1502
+ "model_module": "@jupyter-widgets/controls",
1503
+ "model_module_version": "1.5.0",
1504
+ "model_name": "HTMLModel",
1505
+ "state": {
1506
+ "_dom_classes": [],
1507
+ "_model_module": "@jupyter-widgets/controls",
1508
+ "_model_module_version": "1.5.0",
1509
+ "_model_name": "HTMLModel",
1510
+ "_view_count": null,
1511
+ "_view_module": "@jupyter-widgets/controls",
1512
+ "_view_module_version": "1.5.0",
1513
+ "_view_name": "HTMLView",
1514
+ "description": "",
1515
+ "description_tooltip": null,
1516
+ "layout": "IPY_MODEL_5cc6716d300e446399e65ac8dd72dccf",
1517
+ "placeholder": "​",
1518
+ "style": "IPY_MODEL_67baaac3028142e8b813c46f7dfe5a36",
1519
+ "value": "Downloading (…)lve/main/config.json: 100%"
1520
+ }
1521
+ },
1522
+ "8bd5b0abca4e4b1ab2a4dc575319b6a9": {
1523
+ "model_module": "@jupyter-widgets/base",
1524
+ "model_module_version": "1.2.0",
1525
+ "model_name": "LayoutModel",
1526
+ "state": {
1527
+ "_model_module": "@jupyter-widgets/base",
1528
+ "_model_module_version": "1.2.0",
1529
+ "_model_name": "LayoutModel",
1530
+ "_view_count": null,
1531
+ "_view_module": "@jupyter-widgets/base",
1532
+ "_view_module_version": "1.2.0",
1533
+ "_view_name": "LayoutView",
1534
+ "align_content": null,
1535
+ "align_items": null,
1536
+ "align_self": null,
1537
+ "border": null,
1538
+ "bottom": null,
1539
+ "display": null,
1540
+ "flex": null,
1541
+ "flex_flow": null,
1542
+ "grid_area": null,
1543
+ "grid_auto_columns": null,
1544
+ "grid_auto_flow": null,
1545
+ "grid_auto_rows": null,
1546
+ "grid_column": null,
1547
+ "grid_gap": null,
1548
+ "grid_row": null,
1549
+ "grid_template_areas": null,
1550
+ "grid_template_columns": null,
1551
+ "grid_template_rows": null,
1552
+ "height": null,
1553
+ "justify_content": null,
1554
+ "justify_items": null,
1555
+ "left": null,
1556
+ "margin": null,
1557
+ "max_height": null,
1558
+ "max_width": null,
1559
+ "min_height": null,
1560
+ "min_width": null,
1561
+ "object_fit": null,
1562
+ "object_position": null,
1563
+ "order": null,
1564
+ "overflow": null,
1565
+ "overflow_x": null,
1566
+ "overflow_y": null,
1567
+ "padding": null,
1568
+ "right": null,
1569
+ "top": null,
1570
+ "visibility": null,
1571
+ "width": null
1572
+ }
1573
+ },
1574
+ "8dde647640d14d77971154ec85674a6b": {
1575
+ "model_module": "@jupyter-widgets/base",
1576
+ "model_module_version": "1.2.0",
1577
+ "model_name": "LayoutModel",
1578
+ "state": {
1579
+ "_model_module": "@jupyter-widgets/base",
1580
+ "_model_module_version": "1.2.0",
1581
+ "_model_name": "LayoutModel",
1582
+ "_view_count": null,
1583
+ "_view_module": "@jupyter-widgets/base",
1584
+ "_view_module_version": "1.2.0",
1585
+ "_view_name": "LayoutView",
1586
+ "align_content": null,
1587
+ "align_items": null,
1588
+ "align_self": null,
1589
+ "border": null,
1590
+ "bottom": null,
1591
+ "display": null,
1592
+ "flex": null,
1593
+ "flex_flow": null,
1594
+ "grid_area": null,
1595
+ "grid_auto_columns": null,
1596
+ "grid_auto_flow": null,
1597
+ "grid_auto_rows": null,
1598
+ "grid_column": null,
1599
+ "grid_gap": null,
1600
+ "grid_row": null,
1601
+ "grid_template_areas": null,
1602
+ "grid_template_columns": null,
1603
+ "grid_template_rows": null,
1604
+ "height": null,
1605
+ "justify_content": null,
1606
+ "justify_items": null,
1607
+ "left": null,
1608
+ "margin": null,
1609
+ "max_height": null,
1610
+ "max_width": null,
1611
+ "min_height": null,
1612
+ "min_width": null,
1613
+ "object_fit": null,
1614
+ "object_position": null,
1615
+ "order": null,
1616
+ "overflow": null,
1617
+ "overflow_x": null,
1618
+ "overflow_y": null,
1619
+ "padding": null,
1620
+ "right": null,
1621
+ "top": null,
1622
+ "visibility": null,
1623
+ "width": null
1624
+ }
1625
+ },
1626
+ "916cfb71473e41cf9f36066faf2cebdc": {
1627
+ "model_module": "@jupyter-widgets/controls",
1628
+ "model_module_version": "1.5.0",
1629
+ "model_name": "DescriptionStyleModel",
1630
+ "state": {
1631
+ "_model_module": "@jupyter-widgets/controls",
1632
+ "_model_module_version": "1.5.0",
1633
+ "_model_name": "DescriptionStyleModel",
1634
+ "_view_count": null,
1635
+ "_view_module": "@jupyter-widgets/base",
1636
+ "_view_module_version": "1.2.0",
1637
+ "_view_name": "StyleView",
1638
+ "description_width": ""
1639
+ }
1640
+ },
1641
+ "9cc517bd3c02412192ab1d76cf33ee73": {
1642
+ "model_module": "@jupyter-widgets/base",
1643
+ "model_module_version": "1.2.0",
1644
+ "model_name": "LayoutModel",
1645
+ "state": {
1646
+ "_model_module": "@jupyter-widgets/base",
1647
+ "_model_module_version": "1.2.0",
1648
+ "_model_name": "LayoutModel",
1649
+ "_view_count": null,
1650
+ "_view_module": "@jupyter-widgets/base",
1651
+ "_view_module_version": "1.2.0",
1652
+ "_view_name": "LayoutView",
1653
+ "align_content": null,
1654
+ "align_items": null,
1655
+ "align_self": null,
1656
+ "border": null,
1657
+ "bottom": null,
1658
+ "display": null,
1659
+ "flex": null,
1660
+ "flex_flow": null,
1661
+ "grid_area": null,
1662
+ "grid_auto_columns": null,
1663
+ "grid_auto_flow": null,
1664
+ "grid_auto_rows": null,
1665
+ "grid_column": null,
1666
+ "grid_gap": null,
1667
+ "grid_row": null,
1668
+ "grid_template_areas": null,
1669
+ "grid_template_columns": null,
1670
+ "grid_template_rows": null,
1671
+ "height": null,
1672
+ "justify_content": null,
1673
+ "justify_items": null,
1674
+ "left": null,
1675
+ "margin": null,
1676
+ "max_height": null,
1677
+ "max_width": null,
1678
+ "min_height": null,
1679
+ "min_width": null,
1680
+ "object_fit": null,
1681
+ "object_position": null,
1682
+ "order": null,
1683
+ "overflow": null,
1684
+ "overflow_x": null,
1685
+ "overflow_y": null,
1686
+ "padding": null,
1687
+ "right": null,
1688
+ "top": null,
1689
+ "visibility": null,
1690
+ "width": null
1691
+ }
1692
+ },
1693
+ "9d7b3990a0da4003994bcdc839127521": {
1694
+ "model_module": "@jupyter-widgets/controls",
1695
+ "model_module_version": "1.5.0",
1696
+ "model_name": "FloatProgressModel",
1697
+ "state": {
1698
+ "_dom_classes": [],
1699
+ "_model_module": "@jupyter-widgets/controls",
1700
+ "_model_module_version": "1.5.0",
1701
+ "_model_name": "FloatProgressModel",
1702
+ "_view_count": null,
1703
+ "_view_module": "@jupyter-widgets/controls",
1704
+ "_view_module_version": "1.5.0",
1705
+ "_view_name": "ProgressView",
1706
+ "bar_style": "success",
1707
+ "description": "",
1708
+ "description_tooltip": null,
1709
+ "layout": "IPY_MODEL_f52616a01da94db18878ce2f9591fcfb",
1710
+ "max": 231508.0,
1711
+ "min": 0.0,
1712
+ "orientation": "horizontal",
1713
+ "style": "IPY_MODEL_3e836d356ce74139944aa886508ac3a7",
1714
+ "value": 231508.0
1715
+ }
1716
+ },
1717
+ "9ddd368390d949c6b4fb40463871ba01": {
1718
+ "model_module": "@jupyter-widgets/controls",
1719
+ "model_module_version": "1.5.0",
1720
+ "model_name": "HTMLModel",
1721
+ "state": {
1722
+ "_dom_classes": [],
1723
+ "_model_module": "@jupyter-widgets/controls",
1724
+ "_model_module_version": "1.5.0",
1725
+ "_model_name": "HTMLModel",
1726
+ "_view_count": null,
1727
+ "_view_module": "@jupyter-widgets/controls",
1728
+ "_view_module_version": "1.5.0",
1729
+ "_view_name": "HTMLView",
1730
+ "description": "",
1731
+ "description_tooltip": null,
1732
+ "layout": "IPY_MODEL_ce0d870e6f8d4f7eb8895d67f22176ca",
1733
+ "placeholder": "​",
1734
+ "style": "IPY_MODEL_b4773f0ecef64f5ea248693fdfbb568e",
1735
+ "value": " 17492/17492 [2:24:05&lt;00:00, 2.84it/s]"
1736
+ }
1737
+ },
1738
+ "a977f4c23c4e40089d7bc9ce0ca728c5": {
1739
+ "model_module": "@jupyter-widgets/controls",
1740
+ "model_module_version": "1.5.0",
1741
+ "model_name": "DescriptionStyleModel",
1742
+ "state": {
1743
+ "_model_module": "@jupyter-widgets/controls",
1744
+ "_model_module_version": "1.5.0",
1745
+ "_model_name": "DescriptionStyleModel",
1746
+ "_view_count": null,
1747
+ "_view_module": "@jupyter-widgets/base",
1748
+ "_view_module_version": "1.2.0",
1749
+ "_view_name": "StyleView",
1750
+ "description_width": ""
1751
+ }
1752
+ },
1753
+ "acc9a4eede7647a49445b89c9ea92cea": {
1754
+ "model_module": "@jupyter-widgets/controls",
1755
+ "model_module_version": "1.5.0",
1756
+ "model_name": "ProgressStyleModel",
1757
+ "state": {
1758
+ "_model_module": "@jupyter-widgets/controls",
1759
+ "_model_module_version": "1.5.0",
1760
+ "_model_name": "ProgressStyleModel",
1761
+ "_view_count": null,
1762
+ "_view_module": "@jupyter-widgets/base",
1763
+ "_view_module_version": "1.2.0",
1764
+ "_view_name": "StyleView",
1765
+ "bar_color": null,
1766
+ "description_width": ""
1767
+ }
1768
+ },
1769
+ "b041fdd5345b4cb1bf0b4ddd1aa4f40c": {
1770
+ "model_module": "@jupyter-widgets/base",
1771
+ "model_module_version": "1.2.0",
1772
+ "model_name": "LayoutModel",
1773
+ "state": {
1774
+ "_model_module": "@jupyter-widgets/base",
1775
+ "_model_module_version": "1.2.0",
1776
+ "_model_name": "LayoutModel",
1777
+ "_view_count": null,
1778
+ "_view_module": "@jupyter-widgets/base",
1779
+ "_view_module_version": "1.2.0",
1780
+ "_view_name": "LayoutView",
1781
+ "align_content": null,
1782
+ "align_items": null,
1783
+ "align_self": null,
1784
+ "border": null,
1785
+ "bottom": null,
1786
+ "display": null,
1787
+ "flex": null,
1788
+ "flex_flow": null,
1789
+ "grid_area": null,
1790
+ "grid_auto_columns": null,
1791
+ "grid_auto_flow": null,
1792
+ "grid_auto_rows": null,
1793
+ "grid_column": null,
1794
+ "grid_gap": null,
1795
+ "grid_row": null,
1796
+ "grid_template_areas": null,
1797
+ "grid_template_columns": null,
1798
+ "grid_template_rows": null,
1799
+ "height": null,
1800
+ "justify_content": null,
1801
+ "justify_items": null,
1802
+ "left": null,
1803
+ "margin": null,
1804
+ "max_height": null,
1805
+ "max_width": null,
1806
+ "min_height": null,
1807
+ "min_width": null,
1808
+ "object_fit": null,
1809
+ "object_position": null,
1810
+ "order": null,
1811
+ "overflow": null,
1812
+ "overflow_x": null,
1813
+ "overflow_y": null,
1814
+ "padding": null,
1815
+ "right": null,
1816
+ "top": null,
1817
+ "visibility": null,
1818
+ "width": null
1819
+ }
1820
+ },
1821
+ "b4773f0ecef64f5ea248693fdfbb568e": {
1822
+ "model_module": "@jupyter-widgets/controls",
1823
+ "model_module_version": "1.5.0",
1824
+ "model_name": "DescriptionStyleModel",
1825
+ "state": {
1826
+ "_model_module": "@jupyter-widgets/controls",
1827
+ "_model_module_version": "1.5.0",
1828
+ "_model_name": "DescriptionStyleModel",
1829
+ "_view_count": null,
1830
+ "_view_module": "@jupyter-widgets/base",
1831
+ "_view_module_version": "1.2.0",
1832
+ "_view_name": "StyleView",
1833
+ "description_width": ""
1834
+ }
1835
+ },
1836
+ "b5ee209943d746a9a47ce936a9d10475": {
1837
+ "model_module": "@jupyter-widgets/base",
1838
+ "model_module_version": "1.2.0",
1839
+ "model_name": "LayoutModel",
1840
+ "state": {
1841
+ "_model_module": "@jupyter-widgets/base",
1842
+ "_model_module_version": "1.2.0",
1843
+ "_model_name": "LayoutModel",
1844
+ "_view_count": null,
1845
+ "_view_module": "@jupyter-widgets/base",
1846
+ "_view_module_version": "1.2.0",
1847
+ "_view_name": "LayoutView",
1848
+ "align_content": null,
1849
+ "align_items": null,
1850
+ "align_self": null,
1851
+ "border": null,
1852
+ "bottom": null,
1853
+ "display": null,
1854
+ "flex": null,
1855
+ "flex_flow": null,
1856
+ "grid_area": null,
1857
+ "grid_auto_columns": null,
1858
+ "grid_auto_flow": null,
1859
+ "grid_auto_rows": null,
1860
+ "grid_column": null,
1861
+ "grid_gap": null,
1862
+ "grid_row": null,
1863
+ "grid_template_areas": null,
1864
+ "grid_template_columns": null,
1865
+ "grid_template_rows": null,
1866
+ "height": null,
1867
+ "justify_content": null,
1868
+ "justify_items": null,
1869
+ "left": null,
1870
+ "margin": null,
1871
+ "max_height": null,
1872
+ "max_width": null,
1873
+ "min_height": null,
1874
+ "min_width": null,
1875
+ "object_fit": null,
1876
+ "object_position": null,
1877
+ "order": null,
1878
+ "overflow": null,
1879
+ "overflow_x": null,
1880
+ "overflow_y": null,
1881
+ "padding": null,
1882
+ "right": null,
1883
+ "top": null,
1884
+ "visibility": null,
1885
+ "width": null
1886
+ }
1887
+ },
1888
+ "b63dc39182534430aa662a90cb731664": {
1889
+ "model_module": "@jupyter-widgets/base",
1890
+ "model_module_version": "1.2.0",
1891
+ "model_name": "LayoutModel",
1892
+ "state": {
1893
+ "_model_module": "@jupyter-widgets/base",
1894
+ "_model_module_version": "1.2.0",
1895
+ "_model_name": "LayoutModel",
1896
+ "_view_count": null,
1897
+ "_view_module": "@jupyter-widgets/base",
1898
+ "_view_module_version": "1.2.0",
1899
+ "_view_name": "LayoutView",
1900
+ "align_content": null,
1901
+ "align_items": null,
1902
+ "align_self": null,
1903
+ "border": null,
1904
+ "bottom": null,
1905
+ "display": null,
1906
+ "flex": null,
1907
+ "flex_flow": null,
1908
+ "grid_area": null,
1909
+ "grid_auto_columns": null,
1910
+ "grid_auto_flow": null,
1911
+ "grid_auto_rows": null,
1912
+ "grid_column": null,
1913
+ "grid_gap": null,
1914
+ "grid_row": null,
1915
+ "grid_template_areas": null,
1916
+ "grid_template_columns": null,
1917
+ "grid_template_rows": null,
1918
+ "height": null,
1919
+ "justify_content": null,
1920
+ "justify_items": null,
1921
+ "left": null,
1922
+ "margin": null,
1923
+ "max_height": null,
1924
+ "max_width": null,
1925
+ "min_height": null,
1926
+ "min_width": null,
1927
+ "object_fit": null,
1928
+ "object_position": null,
1929
+ "order": null,
1930
+ "overflow": null,
1931
+ "overflow_x": null,
1932
+ "overflow_y": null,
1933
+ "padding": null,
1934
+ "right": null,
1935
+ "top": null,
1936
+ "visibility": null,
1937
+ "width": null
1938
+ }
1939
+ },
1940
+ "b8f7681ae1974b21bc73a86d9bd0dc13": {
1941
+ "model_module": "@jupyter-widgets/base",
1942
+ "model_module_version": "1.2.0",
1943
+ "model_name": "LayoutModel",
1944
+ "state": {
1945
+ "_model_module": "@jupyter-widgets/base",
1946
+ "_model_module_version": "1.2.0",
1947
+ "_model_name": "LayoutModel",
1948
+ "_view_count": null,
1949
+ "_view_module": "@jupyter-widgets/base",
1950
+ "_view_module_version": "1.2.0",
1951
+ "_view_name": "LayoutView",
1952
+ "align_content": null,
1953
+ "align_items": null,
1954
+ "align_self": null,
1955
+ "border": null,
1956
+ "bottom": null,
1957
+ "display": null,
1958
+ "flex": null,
1959
+ "flex_flow": null,
1960
+ "grid_area": null,
1961
+ "grid_auto_columns": null,
1962
+ "grid_auto_flow": null,
1963
+ "grid_auto_rows": null,
1964
+ "grid_column": null,
1965
+ "grid_gap": null,
1966
+ "grid_row": null,
1967
+ "grid_template_areas": null,
1968
+ "grid_template_columns": null,
1969
+ "grid_template_rows": null,
1970
+ "height": null,
1971
+ "justify_content": null,
1972
+ "justify_items": null,
1973
+ "left": null,
1974
+ "margin": null,
1975
+ "max_height": null,
1976
+ "max_width": null,
1977
+ "min_height": null,
1978
+ "min_width": null,
1979
+ "object_fit": null,
1980
+ "object_position": null,
1981
+ "order": null,
1982
+ "overflow": null,
1983
+ "overflow_x": null,
1984
+ "overflow_y": null,
1985
+ "padding": null,
1986
+ "right": null,
1987
+ "top": null,
1988
+ "visibility": null,
1989
+ "width": null
1990
+ }
1991
+ },
1992
+ "bb422963eb084ec783bfcf190950a2f0": {
1993
+ "model_module": "@jupyter-widgets/controls",
1994
+ "model_module_version": "1.5.0",
1995
+ "model_name": "HBoxModel",
1996
+ "state": {
1997
+ "_dom_classes": [],
1998
+ "_model_module": "@jupyter-widgets/controls",
1999
+ "_model_module_version": "1.5.0",
2000
+ "_model_name": "HBoxModel",
2001
+ "_view_count": null,
2002
+ "_view_module": "@jupyter-widgets/controls",
2003
+ "_view_module_version": "1.5.0",
2004
+ "_view_name": "HBoxView",
2005
+ "box_style": "",
2006
+ "children": [
2007
+ "IPY_MODEL_4888b08f9cc54d1f8a7199e4f0139aeb",
2008
+ "IPY_MODEL_5c5c72fdad194864a1b71ed5637a7efc",
2009
+ "IPY_MODEL_df2f8334d0db4148bcea4cca910f5228"
2010
+ ],
2011
+ "layout": "IPY_MODEL_2842c25aef774a7b9eab85c90f18b933"
2012
+ }
2013
+ },
2014
+ "bda35a315662410fb7b68d63b56c5cfc": {
2015
+ "model_module": "@jupyter-widgets/base",
2016
+ "model_module_version": "1.2.0",
2017
+ "model_name": "LayoutModel",
2018
+ "state": {
2019
+ "_model_module": "@jupyter-widgets/base",
2020
+ "_model_module_version": "1.2.0",
2021
+ "_model_name": "LayoutModel",
2022
+ "_view_count": null,
2023
+ "_view_module": "@jupyter-widgets/base",
2024
+ "_view_module_version": "1.2.0",
2025
+ "_view_name": "LayoutView",
2026
+ "align_content": null,
2027
+ "align_items": null,
2028
+ "align_self": null,
2029
+ "border": null,
2030
+ "bottom": null,
2031
+ "display": null,
2032
+ "flex": null,
2033
+ "flex_flow": null,
2034
+ "grid_area": null,
2035
+ "grid_auto_columns": null,
2036
+ "grid_auto_flow": null,
2037
+ "grid_auto_rows": null,
2038
+ "grid_column": null,
2039
+ "grid_gap": null,
2040
+ "grid_row": null,
2041
+ "grid_template_areas": null,
2042
+ "grid_template_columns": null,
2043
+ "grid_template_rows": null,
2044
+ "height": null,
2045
+ "justify_content": null,
2046
+ "justify_items": null,
2047
+ "left": null,
2048
+ "margin": null,
2049
+ "max_height": null,
2050
+ "max_width": null,
2051
+ "min_height": null,
2052
+ "min_width": null,
2053
+ "object_fit": null,
2054
+ "object_position": null,
2055
+ "order": null,
2056
+ "overflow": null,
2057
+ "overflow_x": null,
2058
+ "overflow_y": null,
2059
+ "padding": null,
2060
+ "right": null,
2061
+ "top": null,
2062
+ "visibility": null,
2063
+ "width": null
2064
+ }
2065
+ },
2066
+ "bee95ee151074c8f99728c877d60b16e": {
2067
+ "model_module": "@jupyter-widgets/controls",
2068
+ "model_module_version": "1.5.0",
2069
+ "model_name": "DescriptionStyleModel",
2070
+ "state": {
2071
+ "_model_module": "@jupyter-widgets/controls",
2072
+ "_model_module_version": "1.5.0",
2073
+ "_model_name": "DescriptionStyleModel",
2074
+ "_view_count": null,
2075
+ "_view_module": "@jupyter-widgets/base",
2076
+ "_view_module_version": "1.2.0",
2077
+ "_view_name": "StyleView",
2078
+ "description_width": ""
2079
+ }
2080
+ },
2081
+ "bf7e94fe0aba40cea4d15a6f598be1ea": {
2082
+ "model_module": "@jupyter-widgets/controls",
2083
+ "model_module_version": "1.5.0",
2084
+ "model_name": "HBoxModel",
2085
+ "state": {
2086
+ "_dom_classes": [],
2087
+ "_model_module": "@jupyter-widgets/controls",
2088
+ "_model_module_version": "1.5.0",
2089
+ "_model_name": "HBoxModel",
2090
+ "_view_count": null,
2091
+ "_view_module": "@jupyter-widgets/controls",
2092
+ "_view_module_version": "1.5.0",
2093
+ "_view_name": "HBoxView",
2094
+ "box_style": "",
2095
+ "children": [
2096
+ "IPY_MODEL_2004f819be47491a933ea34bd72cfcc1",
2097
+ "IPY_MODEL_e44c83eeed31480592f70fc2017aad2d",
2098
+ "IPY_MODEL_703ed0de51694202b67cc2d006f10c5a"
2099
+ ],
2100
+ "layout": "IPY_MODEL_2b1a638fb2794b69b0f73e87ea6d072d"
2101
+ }
2102
+ },
2103
+ "c09779cc5dad442abb4319432b6e2d1a": {
2104
+ "model_module": "@jupyter-widgets/controls",
2105
+ "model_module_version": "1.5.0",
2106
+ "model_name": "HTMLModel",
2107
+ "state": {
2108
+ "_dom_classes": [],
2109
+ "_model_module": "@jupyter-widgets/controls",
2110
+ "_model_module_version": "1.5.0",
2111
+ "_model_name": "HTMLModel",
2112
+ "_view_count": null,
2113
+ "_view_module": "@jupyter-widgets/controls",
2114
+ "_view_module_version": "1.5.0",
2115
+ "_view_name": "HTMLView",
2116
+ "description": "",
2117
+ "description_tooltip": null,
2118
+ "layout": "IPY_MODEL_ce54313c49594e3a9b47544c0828b1da",
2119
+ "placeholder": "​",
2120
+ "style": "IPY_MODEL_a977f4c23c4e40089d7bc9ce0ca728c5",
2121
+ "value": "Downloading (…)solve/main/vocab.txt: 100%"
2122
+ }
2123
+ },
2124
+ "c8af93bd46334dac82e376643918f119": {
2125
+ "model_module": "@jupyter-widgets/base",
2126
+ "model_module_version": "1.2.0",
2127
+ "model_name": "LayoutModel",
2128
+ "state": {
2129
+ "_model_module": "@jupyter-widgets/base",
2130
+ "_model_module_version": "1.2.0",
2131
+ "_model_name": "LayoutModel",
2132
+ "_view_count": null,
2133
+ "_view_module": "@jupyter-widgets/base",
2134
+ "_view_module_version": "1.2.0",
2135
+ "_view_name": "LayoutView",
2136
+ "align_content": null,
2137
+ "align_items": null,
2138
+ "align_self": null,
2139
+ "border": null,
2140
+ "bottom": null,
2141
+ "display": null,
2142
+ "flex": null,
2143
+ "flex_flow": null,
2144
+ "grid_area": null,
2145
+ "grid_auto_columns": null,
2146
+ "grid_auto_flow": null,
2147
+ "grid_auto_rows": null,
2148
+ "grid_column": null,
2149
+ "grid_gap": null,
2150
+ "grid_row": null,
2151
+ "grid_template_areas": null,
2152
+ "grid_template_columns": null,
2153
+ "grid_template_rows": null,
2154
+ "height": null,
2155
+ "justify_content": null,
2156
+ "justify_items": null,
2157
+ "left": null,
2158
+ "margin": null,
2159
+ "max_height": null,
2160
+ "max_width": null,
2161
+ "min_height": null,
2162
+ "min_width": null,
2163
+ "object_fit": null,
2164
+ "object_position": null,
2165
+ "order": null,
2166
+ "overflow": null,
2167
+ "overflow_x": null,
2168
+ "overflow_y": null,
2169
+ "padding": null,
2170
+ "right": null,
2171
+ "top": null,
2172
+ "visibility": null,
2173
+ "width": null
2174
+ }
2175
+ },
2176
+ "ce0d870e6f8d4f7eb8895d67f22176ca": {
2177
+ "model_module": "@jupyter-widgets/base",
2178
+ "model_module_version": "1.2.0",
2179
+ "model_name": "LayoutModel",
2180
+ "state": {
2181
+ "_model_module": "@jupyter-widgets/base",
2182
+ "_model_module_version": "1.2.0",
2183
+ "_model_name": "LayoutModel",
2184
+ "_view_count": null,
2185
+ "_view_module": "@jupyter-widgets/base",
2186
+ "_view_module_version": "1.2.0",
2187
+ "_view_name": "LayoutView",
2188
+ "align_content": null,
2189
+ "align_items": null,
2190
+ "align_self": null,
2191
+ "border": null,
2192
+ "bottom": null,
2193
+ "display": null,
2194
+ "flex": null,
2195
+ "flex_flow": null,
2196
+ "grid_area": null,
2197
+ "grid_auto_columns": null,
2198
+ "grid_auto_flow": null,
2199
+ "grid_auto_rows": null,
2200
+ "grid_column": null,
2201
+ "grid_gap": null,
2202
+ "grid_row": null,
2203
+ "grid_template_areas": null,
2204
+ "grid_template_columns": null,
2205
+ "grid_template_rows": null,
2206
+ "height": null,
2207
+ "justify_content": null,
2208
+ "justify_items": null,
2209
+ "left": null,
2210
+ "margin": null,
2211
+ "max_height": null,
2212
+ "max_width": null,
2213
+ "min_height": null,
2214
+ "min_width": null,
2215
+ "object_fit": null,
2216
+ "object_position": null,
2217
+ "order": null,
2218
+ "overflow": null,
2219
+ "overflow_x": null,
2220
+ "overflow_y": null,
2221
+ "padding": null,
2222
+ "right": null,
2223
+ "top": null,
2224
+ "visibility": null,
2225
+ "width": null
2226
+ }
2227
+ },
2228
+ "ce54313c49594e3a9b47544c0828b1da": {
2229
+ "model_module": "@jupyter-widgets/base",
2230
+ "model_module_version": "1.2.0",
2231
+ "model_name": "LayoutModel",
2232
+ "state": {
2233
+ "_model_module": "@jupyter-widgets/base",
2234
+ "_model_module_version": "1.2.0",
2235
+ "_model_name": "LayoutModel",
2236
+ "_view_count": null,
2237
+ "_view_module": "@jupyter-widgets/base",
2238
+ "_view_module_version": "1.2.0",
2239
+ "_view_name": "LayoutView",
2240
+ "align_content": null,
2241
+ "align_items": null,
2242
+ "align_self": null,
2243
+ "border": null,
2244
+ "bottom": null,
2245
+ "display": null,
2246
+ "flex": null,
2247
+ "flex_flow": null,
2248
+ "grid_area": null,
2249
+ "grid_auto_columns": null,
2250
+ "grid_auto_flow": null,
2251
+ "grid_auto_rows": null,
2252
+ "grid_column": null,
2253
+ "grid_gap": null,
2254
+ "grid_row": null,
2255
+ "grid_template_areas": null,
2256
+ "grid_template_columns": null,
2257
+ "grid_template_rows": null,
2258
+ "height": null,
2259
+ "justify_content": null,
2260
+ "justify_items": null,
2261
+ "left": null,
2262
+ "margin": null,
2263
+ "max_height": null,
2264
+ "max_width": null,
2265
+ "min_height": null,
2266
+ "min_width": null,
2267
+ "object_fit": null,
2268
+ "object_position": null,
2269
+ "order": null,
2270
+ "overflow": null,
2271
+ "overflow_x": null,
2272
+ "overflow_y": null,
2273
+ "padding": null,
2274
+ "right": null,
2275
+ "top": null,
2276
+ "visibility": null,
2277
+ "width": null
2278
+ }
2279
+ },
2280
+ "cf46572053f6463fb4ebd4fcaf0121e3": {
2281
+ "model_module": "@jupyter-widgets/controls",
2282
+ "model_module_version": "1.5.0",
2283
+ "model_name": "FloatProgressModel",
2284
+ "state": {
2285
+ "_dom_classes": [],
2286
+ "_model_module": "@jupyter-widgets/controls",
2287
+ "_model_module_version": "1.5.0",
2288
+ "_model_name": "FloatProgressModel",
2289
+ "_view_count": null,
2290
+ "_view_module": "@jupyter-widgets/controls",
2291
+ "_view_module_version": "1.5.0",
2292
+ "_view_name": "ProgressView",
2293
+ "bar_style": "success",
2294
+ "description": "",
2295
+ "description_tooltip": null,
2296
+ "layout": "IPY_MODEL_fa1a6d7af8a041479bab305634dfdbdf",
2297
+ "max": 112.0,
2298
+ "min": 0.0,
2299
+ "orientation": "horizontal",
2300
+ "style": "IPY_MODEL_fbe6b400ba214967ac7020a910404935",
2301
+ "value": 112.0
2302
+ }
2303
+ },
2304
+ "cfdcfa34092946f2a963cb2efaaa69ad": {
2305
+ "model_module": "@jupyter-widgets/controls",
2306
+ "model_module_version": "1.5.0",
2307
+ "model_name": "DescriptionStyleModel",
2308
+ "state": {
2309
+ "_model_module": "@jupyter-widgets/controls",
2310
+ "_model_module_version": "1.5.0",
2311
+ "_model_name": "DescriptionStyleModel",
2312
+ "_view_count": null,
2313
+ "_view_module": "@jupyter-widgets/base",
2314
+ "_view_module_version": "1.2.0",
2315
+ "_view_name": "StyleView",
2316
+ "description_width": ""
2317
+ }
2318
+ },
2319
+ "d450a5a84ea04020a24228c4acd81696": {
2320
+ "model_module": "@jupyter-widgets/controls",
2321
+ "model_module_version": "1.5.0",
2322
+ "model_name": "HBoxModel",
2323
+ "state": {
2324
+ "_dom_classes": [],
2325
+ "_model_module": "@jupyter-widgets/controls",
2326
+ "_model_module_version": "1.5.0",
2327
+ "_model_name": "HBoxModel",
2328
+ "_view_count": null,
2329
+ "_view_module": "@jupyter-widgets/controls",
2330
+ "_view_module_version": "1.5.0",
2331
+ "_view_name": "HBoxView",
2332
+ "box_style": "",
2333
+ "children": [
2334
+ "IPY_MODEL_c09779cc5dad442abb4319432b6e2d1a",
2335
+ "IPY_MODEL_9d7b3990a0da4003994bcdc839127521",
2336
+ "IPY_MODEL_151ab56449e8416cb04ce3d0be5d8899"
2337
+ ],
2338
+ "layout": "IPY_MODEL_9cc517bd3c02412192ab1d76cf33ee73"
2339
+ }
2340
+ },
2341
+ "d9f09e15efdf4809af048238299005ef": {
2342
+ "model_module": "@jupyter-widgets/controls",
2343
+ "model_module_version": "1.5.0",
2344
+ "model_name": "DescriptionStyleModel",
2345
+ "state": {
2346
+ "_model_module": "@jupyter-widgets/controls",
2347
+ "_model_module_version": "1.5.0",
2348
+ "_model_name": "DescriptionStyleModel",
2349
+ "_view_count": null,
2350
+ "_view_module": "@jupyter-widgets/base",
2351
+ "_view_module_version": "1.2.0",
2352
+ "_view_name": "StyleView",
2353
+ "description_width": ""
2354
+ }
2355
+ },
2356
+ "dee5ee6686494be8b7be41e01576cd77": {
2357
+ "model_module": "@jupyter-widgets/controls",
2358
+ "model_module_version": "1.5.0",
2359
+ "model_name": "DescriptionStyleModel",
2360
+ "state": {
2361
+ "_model_module": "@jupyter-widgets/controls",
2362
+ "_model_module_version": "1.5.0",
2363
+ "_model_name": "DescriptionStyleModel",
2364
+ "_view_count": null,
2365
+ "_view_module": "@jupyter-widgets/base",
2366
+ "_view_module_version": "1.2.0",
2367
+ "_view_name": "StyleView",
2368
+ "description_width": ""
2369
+ }
2370
+ },
2371
+ "df2f8334d0db4148bcea4cca910f5228": {
2372
+ "model_module": "@jupyter-widgets/controls",
2373
+ "model_module_version": "1.5.0",
2374
+ "model_name": "HTMLModel",
2375
+ "state": {
2376
+ "_dom_classes": [],
2377
+ "_model_module": "@jupyter-widgets/controls",
2378
+ "_model_module_version": "1.5.0",
2379
+ "_model_name": "HTMLModel",
2380
+ "_view_count": null,
2381
+ "_view_module": "@jupyter-widgets/controls",
2382
+ "_view_module_version": "1.5.0",
2383
+ "_view_name": "HTMLView",
2384
+ "description": "",
2385
+ "description_tooltip": null,
2386
+ "layout": "IPY_MODEL_24bf29b8f9384543ba43093895045582",
2387
+ "placeholder": "​",
2388
+ "style": "IPY_MODEL_916cfb71473e41cf9f36066faf2cebdc",
2389
+ "value": " 466k/466k [00:00&lt;00:00, 7.57MB/s]"
2390
+ }
2391
+ },
2392
+ "e0f8d3bc44474dd9a512846b4aa34870": {
2393
+ "model_module": "@jupyter-widgets/controls",
2394
+ "model_module_version": "1.5.0",
2395
+ "model_name": "ProgressStyleModel",
2396
+ "state": {
2397
+ "_model_module": "@jupyter-widgets/controls",
2398
+ "_model_module_version": "1.5.0",
2399
+ "_model_name": "ProgressStyleModel",
2400
+ "_view_count": null,
2401
+ "_view_module": "@jupyter-widgets/base",
2402
+ "_view_module_version": "1.2.0",
2403
+ "_view_name": "StyleView",
2404
+ "bar_color": null,
2405
+ "description_width": ""
2406
+ }
2407
+ },
2408
+ "e380ed94e29a4ceda0dee6b8da910a12": {
2409
+ "model_module": "@jupyter-widgets/controls",
2410
+ "model_module_version": "1.5.0",
2411
+ "model_name": "FloatProgressModel",
2412
+ "state": {
2413
+ "_dom_classes": [],
2414
+ "_model_module": "@jupyter-widgets/controls",
2415
+ "_model_module_version": "1.5.0",
2416
+ "_model_name": "FloatProgressModel",
2417
+ "_view_count": null,
2418
+ "_view_module": "@jupyter-widgets/controls",
2419
+ "_view_module_version": "1.5.0",
2420
+ "_view_name": "ProgressView",
2421
+ "bar_style": "success",
2422
+ "description": "",
2423
+ "description_tooltip": null,
2424
+ "layout": "IPY_MODEL_0c559307133043619b80d489c7970617",
2425
+ "max": 612.0,
2426
+ "min": 0.0,
2427
+ "orientation": "horizontal",
2428
+ "style": "IPY_MODEL_3cf3d82361884b55b2bd03ac4ec57d55",
2429
+ "value": 612.0
2430
+ }
2431
+ },
2432
+ "e44c83eeed31480592f70fc2017aad2d": {
2433
+ "model_module": "@jupyter-widgets/controls",
2434
+ "model_module_version": "1.5.0",
2435
+ "model_name": "FloatProgressModel",
2436
+ "state": {
2437
+ "_dom_classes": [],
2438
+ "_model_module": "@jupyter-widgets/controls",
2439
+ "_model_module_version": "1.5.0",
2440
+ "_model_name": "FloatProgressModel",
2441
+ "_view_count": null,
2442
+ "_view_module": "@jupyter-widgets/controls",
2443
+ "_view_module_version": "1.5.0",
2444
+ "_view_name": "ProgressView",
2445
+ "bar_style": "success",
2446
+ "description": "",
2447
+ "description_tooltip": null,
2448
+ "layout": "IPY_MODEL_c8af93bd46334dac82e376643918f119",
2449
+ "max": 350.0,
2450
+ "min": 0.0,
2451
+ "orientation": "horizontal",
2452
+ "style": "IPY_MODEL_e0f8d3bc44474dd9a512846b4aa34870",
2453
+ "value": 350.0
2454
+ }
2455
+ },
2456
+ "ec9c1d9e2d7e4c38955ed3455ea216f6": {
2457
+ "model_module": "@jupyter-widgets/controls",
2458
+ "model_module_version": "1.5.0",
2459
+ "model_name": "HTMLModel",
2460
+ "state": {
2461
+ "_dom_classes": [],
2462
+ "_model_module": "@jupyter-widgets/controls",
2463
+ "_model_module_version": "1.5.0",
2464
+ "_model_name": "HTMLModel",
2465
+ "_view_count": null,
2466
+ "_view_module": "@jupyter-widgets/controls",
2467
+ "_view_module_version": "1.5.0",
2468
+ "_view_name": "HTMLView",
2469
+ "description": "",
2470
+ "description_tooltip": null,
2471
+ "layout": "IPY_MODEL_f86cb31528414b07ad0d9755881bf9e5",
2472
+ "placeholder": "​",
2473
+ "style": "IPY_MODEL_cfdcfa34092946f2a963cb2efaaa69ad",
2474
+ "value": " 90.9M/90.9M [00:00&lt;00:00, 145MB/s]"
2475
+ }
2476
+ },
2477
+ "f52616a01da94db18878ce2f9591fcfb": {
2478
+ "model_module": "@jupyter-widgets/base",
2479
+ "model_module_version": "1.2.0",
2480
+ "model_name": "LayoutModel",
2481
+ "state": {
2482
+ "_model_module": "@jupyter-widgets/base",
2483
+ "_model_module_version": "1.2.0",
2484
+ "_model_name": "LayoutModel",
2485
+ "_view_count": null,
2486
+ "_view_module": "@jupyter-widgets/base",
2487
+ "_view_module_version": "1.2.0",
2488
+ "_view_name": "LayoutView",
2489
+ "align_content": null,
2490
+ "align_items": null,
2491
+ "align_self": null,
2492
+ "border": null,
2493
+ "bottom": null,
2494
+ "display": null,
2495
+ "flex": null,
2496
+ "flex_flow": null,
2497
+ "grid_area": null,
2498
+ "grid_auto_columns": null,
2499
+ "grid_auto_flow": null,
2500
+ "grid_auto_rows": null,
2501
+ "grid_column": null,
2502
+ "grid_gap": null,
2503
+ "grid_row": null,
2504
+ "grid_template_areas": null,
2505
+ "grid_template_columns": null,
2506
+ "grid_template_rows": null,
2507
+ "height": null,
2508
+ "justify_content": null,
2509
+ "justify_items": null,
2510
+ "left": null,
2511
+ "margin": null,
2512
+ "max_height": null,
2513
+ "max_width": null,
2514
+ "min_height": null,
2515
+ "min_width": null,
2516
+ "object_fit": null,
2517
+ "object_position": null,
2518
+ "order": null,
2519
+ "overflow": null,
2520
+ "overflow_x": null,
2521
+ "overflow_y": null,
2522
+ "padding": null,
2523
+ "right": null,
2524
+ "top": null,
2525
+ "visibility": null,
2526
+ "width": null
2527
+ }
2528
+ },
2529
+ "f86cb31528414b07ad0d9755881bf9e5": {
2530
+ "model_module": "@jupyter-widgets/base",
2531
+ "model_module_version": "1.2.0",
2532
+ "model_name": "LayoutModel",
2533
+ "state": {
2534
+ "_model_module": "@jupyter-widgets/base",
2535
+ "_model_module_version": "1.2.0",
2536
+ "_model_name": "LayoutModel",
2537
+ "_view_count": null,
2538
+ "_view_module": "@jupyter-widgets/base",
2539
+ "_view_module_version": "1.2.0",
2540
+ "_view_name": "LayoutView",
2541
+ "align_content": null,
2542
+ "align_items": null,
2543
+ "align_self": null,
2544
+ "border": null,
2545
+ "bottom": null,
2546
+ "display": null,
2547
+ "flex": null,
2548
+ "flex_flow": null,
2549
+ "grid_area": null,
2550
+ "grid_auto_columns": null,
2551
+ "grid_auto_flow": null,
2552
+ "grid_auto_rows": null,
2553
+ "grid_column": null,
2554
+ "grid_gap": null,
2555
+ "grid_row": null,
2556
+ "grid_template_areas": null,
2557
+ "grid_template_columns": null,
2558
+ "grid_template_rows": null,
2559
+ "height": null,
2560
+ "justify_content": null,
2561
+ "justify_items": null,
2562
+ "left": null,
2563
+ "margin": null,
2564
+ "max_height": null,
2565
+ "max_width": null,
2566
+ "min_height": null,
2567
+ "min_width": null,
2568
+ "object_fit": null,
2569
+ "object_position": null,
2570
+ "order": null,
2571
+ "overflow": null,
2572
+ "overflow_x": null,
2573
+ "overflow_y": null,
2574
+ "padding": null,
2575
+ "right": null,
2576
+ "top": null,
2577
+ "visibility": null,
2578
+ "width": null
2579
+ }
2580
+ },
2581
+ "fa1a6d7af8a041479bab305634dfdbdf": {
2582
+ "model_module": "@jupyter-widgets/base",
2583
+ "model_module_version": "1.2.0",
2584
+ "model_name": "LayoutModel",
2585
+ "state": {
2586
+ "_model_module": "@jupyter-widgets/base",
2587
+ "_model_module_version": "1.2.0",
2588
+ "_model_name": "LayoutModel",
2589
+ "_view_count": null,
2590
+ "_view_module": "@jupyter-widgets/base",
2591
+ "_view_module_version": "1.2.0",
2592
+ "_view_name": "LayoutView",
2593
+ "align_content": null,
2594
+ "align_items": null,
2595
+ "align_self": null,
2596
+ "border": null,
2597
+ "bottom": null,
2598
+ "display": null,
2599
+ "flex": null,
2600
+ "flex_flow": null,
2601
+ "grid_area": null,
2602
+ "grid_auto_columns": null,
2603
+ "grid_auto_flow": null,
2604
+ "grid_auto_rows": null,
2605
+ "grid_column": null,
2606
+ "grid_gap": null,
2607
+ "grid_row": null,
2608
+ "grid_template_areas": null,
2609
+ "grid_template_columns": null,
2610
+ "grid_template_rows": null,
2611
+ "height": null,
2612
+ "justify_content": null,
2613
+ "justify_items": null,
2614
+ "left": null,
2615
+ "margin": null,
2616
+ "max_height": null,
2617
+ "max_width": null,
2618
+ "min_height": null,
2619
+ "min_width": null,
2620
+ "object_fit": null,
2621
+ "object_position": null,
2622
+ "order": null,
2623
+ "overflow": null,
2624
+ "overflow_x": null,
2625
+ "overflow_y": null,
2626
+ "padding": null,
2627
+ "right": null,
2628
+ "top": null,
2629
+ "visibility": null,
2630
+ "width": null
2631
+ }
2632
+ },
2633
+ "fbe6b400ba214967ac7020a910404935": {
2634
+ "model_module": "@jupyter-widgets/controls",
2635
+ "model_module_version": "1.5.0",
2636
+ "model_name": "ProgressStyleModel",
2637
+ "state": {
2638
+ "_model_module": "@jupyter-widgets/controls",
2639
+ "_model_module_version": "1.5.0",
2640
+ "_model_name": "ProgressStyleModel",
2641
+ "_view_count": null,
2642
+ "_view_module": "@jupyter-widgets/base",
2643
+ "_view_module_version": "1.2.0",
2644
+ "_view_name": "StyleView",
2645
+ "bar_color": null,
2646
+ "description_width": ""
2647
+ }
2648
+ },
2649
+ "fe2339e92ef34a669751ef54d20b09fd": {
2650
+ "model_module": "@jupyter-widgets/controls",
2651
+ "model_module_version": "1.5.0",
2652
+ "model_name": "FloatProgressModel",
2653
+ "state": {
2654
+ "_dom_classes": [],
2655
+ "_model_module": "@jupyter-widgets/controls",
2656
+ "_model_module_version": "1.5.0",
2657
+ "_model_name": "FloatProgressModel",
2658
+ "_view_count": null,
2659
+ "_view_module": "@jupyter-widgets/controls",
2660
+ "_view_module_version": "1.5.0",
2661
+ "_view_name": "ProgressView",
2662
+ "bar_style": "success",
2663
+ "description": "",
2664
+ "description_tooltip": null,
2665
+ "layout": "IPY_MODEL_20cac87ded1444e4818e0448ab7748c2",
2666
+ "max": 90888945.0,
2667
+ "min": 0.0,
2668
+ "orientation": "horizontal",
2669
+ "style": "IPY_MODEL_299f0b46936f450092d10b436f6b43a3",
2670
+ "value": 90888945.0
2671
+ }
2672
+ }
2673
+ },
2674
+ "version_major": 2,
2675
+ "version_minor": 0
2676
+ }
2677
+ }
2678
+ },
2679
+ "nbformat": 4,
2680
+ "nbformat_minor": 5
2681
+ }
Notebooks/ysda-ml-02-05-process-json.ipynb ADDED
@@ -0,0 +1,867 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "code",
5
+ "execution_count": 1,
6
+ "id": "053d77d6",
7
+ "metadata": {
8
+ "_cell_guid": "b1076dfc-b9ad-4769-8c92-a6c4dae69d19",
9
+ "_uuid": "8f2839f25d086af736a60e9eeb907d3b93b6e0e5",
10
+ "execution": {
11
+ "iopub.execute_input": "2023-04-16T17:54:22.150398Z",
12
+ "iopub.status.busy": "2023-04-16T17:54:22.149996Z",
13
+ "iopub.status.idle": "2023-04-16T17:54:23.370151Z",
14
+ "shell.execute_reply": "2023-04-16T17:54:23.368894Z"
15
+ },
16
+ "papermill": {
17
+ "duration": 1.228699,
18
+ "end_time": "2023-04-16T17:54:23.373574",
19
+ "exception": false,
20
+ "start_time": "2023-04-16T17:54:22.144875",
21
+ "status": "completed"
22
+ },
23
+ "tags": []
24
+ },
25
+ "outputs": [],
26
+ "source": [
27
+ "import datasets\n",
28
+ "from datasets import Dataset\n",
29
+ "import numpy as np\n",
30
+ "import json\n",
31
+ "import os\n",
32
+ "from tqdm.notebook import tqdm as tqdm\n",
33
+ "\n",
34
+ "INPUT_PATH = '/kaggle/input/arxiv/arxiv-metadata-oai-snapshot.json'\n",
35
+ "OUTPUT_PATH = '/kaggle/working/articles.hf'"
36
+ ]
37
+ },
38
+ {
39
+ "cell_type": "code",
40
+ "execution_count": 2,
41
+ "id": "fa6321f0",
42
+ "metadata": {
43
+ "execution": {
44
+ "iopub.execute_input": "2023-04-16T17:54:23.379601Z",
45
+ "iopub.status.busy": "2023-04-16T17:54:23.378999Z",
46
+ "iopub.status.idle": "2023-04-16T17:54:23.389555Z",
47
+ "shell.execute_reply": "2023-04-16T17:54:23.388183Z"
48
+ },
49
+ "papermill": {
50
+ "duration": 0.016368,
51
+ "end_time": "2023-04-16T17:54:23.392224",
52
+ "exception": false,
53
+ "start_time": "2023-04-16T17:54:23.375856",
54
+ "status": "completed"
55
+ },
56
+ "tags": []
57
+ },
58
+ "outputs": [],
59
+ "source": [
60
+ "def read_json(filename):\n",
61
+ " with open(filename) as f:\n",
62
+ " for line in tqdm(f):\n",
63
+ " yield json.loads(line)\n",
64
+ "\n",
65
+ "\n",
66
+ "def prepare_text(text):\n",
67
+ " return ' '.join(text.split()) # Remove \\n\n",
68
+ "\n",
69
+ "\n",
70
+ "def prepare_articles(raw_articles):\n",
71
+ " articles = dict()\n",
72
+ " articles['id'] = []\n",
73
+ " articles['title'] = []\n",
74
+ " articles['abstract'] = []\n",
75
+ " \n",
76
+ " for raw_article in tqdm(raw_articles):\n",
77
+ " articles['id'].append(raw_article['id'])\n",
78
+ " articles['title'].append(prepare_text(raw_article['title']))\n",
79
+ " articles['abstract'].append(prepare_text(raw_article['abstract']))\n",
80
+ " \n",
81
+ " return articles"
82
+ ]
83
+ },
84
+ {
85
+ "cell_type": "code",
86
+ "execution_count": 3,
87
+ "id": "002d5a96",
88
+ "metadata": {
89
+ "execution": {
90
+ "iopub.execute_input": "2023-04-16T17:54:23.397598Z",
91
+ "iopub.status.busy": "2023-04-16T17:54:23.397210Z",
92
+ "iopub.status.idle": "2023-04-16T17:56:09.339424Z",
93
+ "shell.execute_reply": "2023-04-16T17:56:09.338210Z"
94
+ },
95
+ "papermill": {
96
+ "duration": 105.948451,
97
+ "end_time": "2023-04-16T17:56:09.342633",
98
+ "exception": false,
99
+ "start_time": "2023-04-16T17:54:23.394182",
100
+ "status": "completed"
101
+ },
102
+ "tags": []
103
+ },
104
+ "outputs": [
105
+ {
106
+ "data": {
107
+ "application/vnd.jupyter.widget-view+json": {
108
+ "model_id": "a93e04563c8b4d41ad6ff43205a3459b",
109
+ "version_major": 2,
110
+ "version_minor": 0
111
+ },
112
+ "text/plain": [
113
+ "0it [00:00, ?it/s]"
114
+ ]
115
+ },
116
+ "metadata": {},
117
+ "output_type": "display_data"
118
+ },
119
+ {
120
+ "data": {
121
+ "application/vnd.jupyter.widget-view+json": {
122
+ "model_id": "44d52183128440d0b3e84659fac0548a",
123
+ "version_major": 2,
124
+ "version_minor": 0
125
+ },
126
+ "text/plain": [
127
+ "0it [00:00, ?it/s]"
128
+ ]
129
+ },
130
+ "metadata": {},
131
+ "output_type": "display_data"
132
+ }
133
+ ],
134
+ "source": [
135
+ "raw_articles = read_json(INPUT_PATH)\n",
136
+ "articles = prepare_articles(raw_articles)\n",
137
+ "dataset = Dataset.from_dict(articles)\n",
138
+ "dataset.save_to_disk(OUTPUT_PATH)"
139
+ ]
140
+ }
141
+ ],
142
+ "metadata": {
143
+ "kernelspec": {
144
+ "display_name": "Python 3",
145
+ "language": "python",
146
+ "name": "python3"
147
+ },
148
+ "language_info": {
149
+ "codemirror_mode": {
150
+ "name": "ipython",
151
+ "version": 3
152
+ },
153
+ "file_extension": ".py",
154
+ "mimetype": "text/x-python",
155
+ "name": "python",
156
+ "nbconvert_exporter": "python",
157
+ "pygments_lexer": "ipython3",
158
+ "version": "3.7.12"
159
+ },
160
+ "papermill": {
161
+ "default_parameters": {},
162
+ "duration": 119.63838,
163
+ "end_time": "2023-04-16T17:56:11.178168",
164
+ "environment_variables": {},
165
+ "exception": null,
166
+ "input_path": "__notebook__.ipynb",
167
+ "output_path": "__notebook__.ipynb",
168
+ "parameters": {},
169
+ "start_time": "2023-04-16T17:54:11.539788",
170
+ "version": "2.4.0"
171
+ },
172
+ "widgets": {
173
+ "application/vnd.jupyter.widget-state+json": {
174
+ "state": {
175
+ "0c336528356c4b2b95f34cb48e174e0c": {
176
+ "model_module": "@jupyter-widgets/controls",
177
+ "model_module_version": "1.5.0",
178
+ "model_name": "DescriptionStyleModel",
179
+ "state": {
180
+ "_model_module": "@jupyter-widgets/controls",
181
+ "_model_module_version": "1.5.0",
182
+ "_model_name": "DescriptionStyleModel",
183
+ "_view_count": null,
184
+ "_view_module": "@jupyter-widgets/base",
185
+ "_view_module_version": "1.2.0",
186
+ "_view_name": "StyleView",
187
+ "description_width": ""
188
+ }
189
+ },
190
+ "113121abfa324736bb8e95fe1a4f1d06": {
191
+ "model_module": "@jupyter-widgets/controls",
192
+ "model_module_version": "1.5.0",
193
+ "model_name": "FloatProgressModel",
194
+ "state": {
195
+ "_dom_classes": [],
196
+ "_model_module": "@jupyter-widgets/controls",
197
+ "_model_module_version": "1.5.0",
198
+ "_model_name": "FloatProgressModel",
199
+ "_view_count": null,
200
+ "_view_module": "@jupyter-widgets/controls",
201
+ "_view_module_version": "1.5.0",
202
+ "_view_name": "ProgressView",
203
+ "bar_style": "success",
204
+ "description": "",
205
+ "description_tooltip": null,
206
+ "layout": "IPY_MODEL_6a64fe0560924b0cad3764b0a6c54ec1",
207
+ "max": 1.0,
208
+ "min": 0.0,
209
+ "orientation": "horizontal",
210
+ "style": "IPY_MODEL_cb6a75abc992433f937a46df79408fc8",
211
+ "value": 1.0
212
+ }
213
+ },
214
+ "2d791a9fdda541379914e44842a56916": {
215
+ "model_module": "@jupyter-widgets/controls",
216
+ "model_module_version": "1.5.0",
217
+ "model_name": "DescriptionStyleModel",
218
+ "state": {
219
+ "_model_module": "@jupyter-widgets/controls",
220
+ "_model_module_version": "1.5.0",
221
+ "_model_name": "DescriptionStyleModel",
222
+ "_view_count": null,
223
+ "_view_module": "@jupyter-widgets/base",
224
+ "_view_module_version": "1.2.0",
225
+ "_view_name": "StyleView",
226
+ "description_width": ""
227
+ }
228
+ },
229
+ "3982ea95d169445b848b1f1424d09bac": {
230
+ "model_module": "@jupyter-widgets/base",
231
+ "model_module_version": "1.2.0",
232
+ "model_name": "LayoutModel",
233
+ "state": {
234
+ "_model_module": "@jupyter-widgets/base",
235
+ "_model_module_version": "1.2.0",
236
+ "_model_name": "LayoutModel",
237
+ "_view_count": null,
238
+ "_view_module": "@jupyter-widgets/base",
239
+ "_view_module_version": "1.2.0",
240
+ "_view_name": "LayoutView",
241
+ "align_content": null,
242
+ "align_items": null,
243
+ "align_self": null,
244
+ "border": null,
245
+ "bottom": null,
246
+ "display": null,
247
+ "flex": null,
248
+ "flex_flow": null,
249
+ "grid_area": null,
250
+ "grid_auto_columns": null,
251
+ "grid_auto_flow": null,
252
+ "grid_auto_rows": null,
253
+ "grid_column": null,
254
+ "grid_gap": null,
255
+ "grid_row": null,
256
+ "grid_template_areas": null,
257
+ "grid_template_columns": null,
258
+ "grid_template_rows": null,
259
+ "height": null,
260
+ "justify_content": null,
261
+ "justify_items": null,
262
+ "left": null,
263
+ "margin": null,
264
+ "max_height": null,
265
+ "max_width": null,
266
+ "min_height": null,
267
+ "min_width": null,
268
+ "object_fit": null,
269
+ "object_position": null,
270
+ "order": null,
271
+ "overflow": null,
272
+ "overflow_x": null,
273
+ "overflow_y": null,
274
+ "padding": null,
275
+ "right": null,
276
+ "top": null,
277
+ "visibility": null,
278
+ "width": "20px"
279
+ }
280
+ },
281
+ "44d52183128440d0b3e84659fac0548a": {
282
+ "model_module": "@jupyter-widgets/controls",
283
+ "model_module_version": "1.5.0",
284
+ "model_name": "HBoxModel",
285
+ "state": {
286
+ "_dom_classes": [],
287
+ "_model_module": "@jupyter-widgets/controls",
288
+ "_model_module_version": "1.5.0",
289
+ "_model_name": "HBoxModel",
290
+ "_view_count": null,
291
+ "_view_module": "@jupyter-widgets/controls",
292
+ "_view_module_version": "1.5.0",
293
+ "_view_name": "HBoxView",
294
+ "box_style": "",
295
+ "children": [
296
+ "IPY_MODEL_a60eea433a804579aa0320aa6ec54db8",
297
+ "IPY_MODEL_903a7b209ce44382a2e2a0dfd49fea40",
298
+ "IPY_MODEL_afe8ad7902ba49f5a56ad93dba8e1537"
299
+ ],
300
+ "layout": "IPY_MODEL_e4706baef659472aaa63e3d2588eb25c"
301
+ }
302
+ },
303
+ "466c11eed88444dead7e03947dc6c5ae": {
304
+ "model_module": "@jupyter-widgets/controls",
305
+ "model_module_version": "1.5.0",
306
+ "model_name": "HTMLModel",
307
+ "state": {
308
+ "_dom_classes": [],
309
+ "_model_module": "@jupyter-widgets/controls",
310
+ "_model_module_version": "1.5.0",
311
+ "_model_name": "HTMLModel",
312
+ "_view_count": null,
313
+ "_view_module": "@jupyter-widgets/controls",
314
+ "_view_module_version": "1.5.0",
315
+ "_view_name": "HTMLView",
316
+ "description": "",
317
+ "description_tooltip": null,
318
+ "layout": "IPY_MODEL_cfeb53d0e1d54b0cb4c1faeecaa0782d",
319
+ "placeholder": "​",
320
+ "style": "IPY_MODEL_8d807c6587c8478a92214a1f50853a5a",
321
+ "value": " 2238880/? [01:35&lt;00:00, 29540.88it/s]"
322
+ }
323
+ },
324
+ "4757c406e2c64fd48db575dc424aa9ab": {
325
+ "model_module": "@jupyter-widgets/base",
326
+ "model_module_version": "1.2.0",
327
+ "model_name": "LayoutModel",
328
+ "state": {
329
+ "_model_module": "@jupyter-widgets/base",
330
+ "_model_module_version": "1.2.0",
331
+ "_model_name": "LayoutModel",
332
+ "_view_count": null,
333
+ "_view_module": "@jupyter-widgets/base",
334
+ "_view_module_version": "1.2.0",
335
+ "_view_name": "LayoutView",
336
+ "align_content": null,
337
+ "align_items": null,
338
+ "align_self": null,
339
+ "border": null,
340
+ "bottom": null,
341
+ "display": null,
342
+ "flex": null,
343
+ "flex_flow": null,
344
+ "grid_area": null,
345
+ "grid_auto_columns": null,
346
+ "grid_auto_flow": null,
347
+ "grid_auto_rows": null,
348
+ "grid_column": null,
349
+ "grid_gap": null,
350
+ "grid_row": null,
351
+ "grid_template_areas": null,
352
+ "grid_template_columns": null,
353
+ "grid_template_rows": null,
354
+ "height": null,
355
+ "justify_content": null,
356
+ "justify_items": null,
357
+ "left": null,
358
+ "margin": null,
359
+ "max_height": null,
360
+ "max_width": null,
361
+ "min_height": null,
362
+ "min_width": null,
363
+ "object_fit": null,
364
+ "object_position": null,
365
+ "order": null,
366
+ "overflow": null,
367
+ "overflow_x": null,
368
+ "overflow_y": null,
369
+ "padding": null,
370
+ "right": null,
371
+ "top": null,
372
+ "visibility": null,
373
+ "width": null
374
+ }
375
+ },
376
+ "6a64fe0560924b0cad3764b0a6c54ec1": {
377
+ "model_module": "@jupyter-widgets/base",
378
+ "model_module_version": "1.2.0",
379
+ "model_name": "LayoutModel",
380
+ "state": {
381
+ "_model_module": "@jupyter-widgets/base",
382
+ "_model_module_version": "1.2.0",
383
+ "_model_name": "LayoutModel",
384
+ "_view_count": null,
385
+ "_view_module": "@jupyter-widgets/base",
386
+ "_view_module_version": "1.2.0",
387
+ "_view_name": "LayoutView",
388
+ "align_content": null,
389
+ "align_items": null,
390
+ "align_self": null,
391
+ "border": null,
392
+ "bottom": null,
393
+ "display": null,
394
+ "flex": null,
395
+ "flex_flow": null,
396
+ "grid_area": null,
397
+ "grid_auto_columns": null,
398
+ "grid_auto_flow": null,
399
+ "grid_auto_rows": null,
400
+ "grid_column": null,
401
+ "grid_gap": null,
402
+ "grid_row": null,
403
+ "grid_template_areas": null,
404
+ "grid_template_columns": null,
405
+ "grid_template_rows": null,
406
+ "height": null,
407
+ "justify_content": null,
408
+ "justify_items": null,
409
+ "left": null,
410
+ "margin": null,
411
+ "max_height": null,
412
+ "max_width": null,
413
+ "min_height": null,
414
+ "min_width": null,
415
+ "object_fit": null,
416
+ "object_position": null,
417
+ "order": null,
418
+ "overflow": null,
419
+ "overflow_x": null,
420
+ "overflow_y": null,
421
+ "padding": null,
422
+ "right": null,
423
+ "top": null,
424
+ "visibility": null,
425
+ "width": "20px"
426
+ }
427
+ },
428
+ "8d807c6587c8478a92214a1f50853a5a": {
429
+ "model_module": "@jupyter-widgets/controls",
430
+ "model_module_version": "1.5.0",
431
+ "model_name": "DescriptionStyleModel",
432
+ "state": {
433
+ "_model_module": "@jupyter-widgets/controls",
434
+ "_model_module_version": "1.5.0",
435
+ "_model_name": "DescriptionStyleModel",
436
+ "_view_count": null,
437
+ "_view_module": "@jupyter-widgets/base",
438
+ "_view_module_version": "1.2.0",
439
+ "_view_name": "StyleView",
440
+ "description_width": ""
441
+ }
442
+ },
443
+ "903a7b209ce44382a2e2a0dfd49fea40": {
444
+ "model_module": "@jupyter-widgets/controls",
445
+ "model_module_version": "1.5.0",
446
+ "model_name": "FloatProgressModel",
447
+ "state": {
448
+ "_dom_classes": [],
449
+ "_model_module": "@jupyter-widgets/controls",
450
+ "_model_module_version": "1.5.0",
451
+ "_model_name": "FloatProgressModel",
452
+ "_view_count": null,
453
+ "_view_module": "@jupyter-widgets/controls",
454
+ "_view_module_version": "1.5.0",
455
+ "_view_name": "ProgressView",
456
+ "bar_style": "success",
457
+ "description": "",
458
+ "description_tooltip": null,
459
+ "layout": "IPY_MODEL_3982ea95d169445b848b1f1424d09bac",
460
+ "max": 1.0,
461
+ "min": 0.0,
462
+ "orientation": "horizontal",
463
+ "style": "IPY_MODEL_b5a36475ff044f7db31af7001872b967",
464
+ "value": 1.0
465
+ }
466
+ },
467
+ "a60eea433a804579aa0320aa6ec54db8": {
468
+ "model_module": "@jupyter-widgets/controls",
469
+ "model_module_version": "1.5.0",
470
+ "model_name": "HTMLModel",
471
+ "state": {
472
+ "_dom_classes": [],
473
+ "_model_module": "@jupyter-widgets/controls",
474
+ "_model_module_version": "1.5.0",
475
+ "_model_name": "HTMLModel",
476
+ "_view_count": null,
477
+ "_view_module": "@jupyter-widgets/controls",
478
+ "_view_module_version": "1.5.0",
479
+ "_view_name": "HTMLView",
480
+ "description": "",
481
+ "description_tooltip": null,
482
+ "layout": "IPY_MODEL_c152f20b488b41218ca7253a831418ad",
483
+ "placeholder": "​",
484
+ "style": "IPY_MODEL_0c336528356c4b2b95f34cb48e174e0c",
485
+ "value": ""
486
+ }
487
+ },
488
+ "a93e04563c8b4d41ad6ff43205a3459b": {
489
+ "model_module": "@jupyter-widgets/controls",
490
+ "model_module_version": "1.5.0",
491
+ "model_name": "HBoxModel",
492
+ "state": {
493
+ "_dom_classes": [],
494
+ "_model_module": "@jupyter-widgets/controls",
495
+ "_model_module_version": "1.5.0",
496
+ "_model_name": "HBoxModel",
497
+ "_view_count": null,
498
+ "_view_module": "@jupyter-widgets/controls",
499
+ "_view_module_version": "1.5.0",
500
+ "_view_name": "HBoxView",
501
+ "box_style": "",
502
+ "children": [
503
+ "IPY_MODEL_d9d454d5308a46c491787ca33faccb33",
504
+ "IPY_MODEL_113121abfa324736bb8e95fe1a4f1d06",
505
+ "IPY_MODEL_466c11eed88444dead7e03947dc6c5ae"
506
+ ],
507
+ "layout": "IPY_MODEL_ce365fd9ffca4e399f43306afd1d82ec"
508
+ }
509
+ },
510
+ "afe8ad7902ba49f5a56ad93dba8e1537": {
511
+ "model_module": "@jupyter-widgets/controls",
512
+ "model_module_version": "1.5.0",
513
+ "model_name": "HTMLModel",
514
+ "state": {
515
+ "_dom_classes": [],
516
+ "_model_module": "@jupyter-widgets/controls",
517
+ "_model_module_version": "1.5.0",
518
+ "_model_name": "HTMLModel",
519
+ "_view_count": null,
520
+ "_view_module": "@jupyter-widgets/controls",
521
+ "_view_module_version": "1.5.0",
522
+ "_view_name": "HTMLView",
523
+ "description": "",
524
+ "description_tooltip": null,
525
+ "layout": "IPY_MODEL_4757c406e2c64fd48db575dc424aa9ab",
526
+ "placeholder": "​",
527
+ "style": "IPY_MODEL_2d791a9fdda541379914e44842a56916",
528
+ "value": " 2238880/? [01:35&lt;00:00, 29550.75it/s]"
529
+ }
530
+ },
531
+ "b4eefbed9af540289bc790d9d699a54f": {
532
+ "model_module": "@jupyter-widgets/controls",
533
+ "model_module_version": "1.5.0",
534
+ "model_name": "DescriptionStyleModel",
535
+ "state": {
536
+ "_model_module": "@jupyter-widgets/controls",
537
+ "_model_module_version": "1.5.0",
538
+ "_model_name": "DescriptionStyleModel",
539
+ "_view_count": null,
540
+ "_view_module": "@jupyter-widgets/base",
541
+ "_view_module_version": "1.2.0",
542
+ "_view_name": "StyleView",
543
+ "description_width": ""
544
+ }
545
+ },
546
+ "b5a36475ff044f7db31af7001872b967": {
547
+ "model_module": "@jupyter-widgets/controls",
548
+ "model_module_version": "1.5.0",
549
+ "model_name": "ProgressStyleModel",
550
+ "state": {
551
+ "_model_module": "@jupyter-widgets/controls",
552
+ "_model_module_version": "1.5.0",
553
+ "_model_name": "ProgressStyleModel",
554
+ "_view_count": null,
555
+ "_view_module": "@jupyter-widgets/base",
556
+ "_view_module_version": "1.2.0",
557
+ "_view_name": "StyleView",
558
+ "bar_color": null,
559
+ "description_width": ""
560
+ }
561
+ },
562
+ "c152f20b488b41218ca7253a831418ad": {
563
+ "model_module": "@jupyter-widgets/base",
564
+ "model_module_version": "1.2.0",
565
+ "model_name": "LayoutModel",
566
+ "state": {
567
+ "_model_module": "@jupyter-widgets/base",
568
+ "_model_module_version": "1.2.0",
569
+ "_model_name": "LayoutModel",
570
+ "_view_count": null,
571
+ "_view_module": "@jupyter-widgets/base",
572
+ "_view_module_version": "1.2.0",
573
+ "_view_name": "LayoutView",
574
+ "align_content": null,
575
+ "align_items": null,
576
+ "align_self": null,
577
+ "border": null,
578
+ "bottom": null,
579
+ "display": null,
580
+ "flex": null,
581
+ "flex_flow": null,
582
+ "grid_area": null,
583
+ "grid_auto_columns": null,
584
+ "grid_auto_flow": null,
585
+ "grid_auto_rows": null,
586
+ "grid_column": null,
587
+ "grid_gap": null,
588
+ "grid_row": null,
589
+ "grid_template_areas": null,
590
+ "grid_template_columns": null,
591
+ "grid_template_rows": null,
592
+ "height": null,
593
+ "justify_content": null,
594
+ "justify_items": null,
595
+ "left": null,
596
+ "margin": null,
597
+ "max_height": null,
598
+ "max_width": null,
599
+ "min_height": null,
600
+ "min_width": null,
601
+ "object_fit": null,
602
+ "object_position": null,
603
+ "order": null,
604
+ "overflow": null,
605
+ "overflow_x": null,
606
+ "overflow_y": null,
607
+ "padding": null,
608
+ "right": null,
609
+ "top": null,
610
+ "visibility": null,
611
+ "width": null
612
+ }
613
+ },
614
+ "cb6a75abc992433f937a46df79408fc8": {
615
+ "model_module": "@jupyter-widgets/controls",
616
+ "model_module_version": "1.5.0",
617
+ "model_name": "ProgressStyleModel",
618
+ "state": {
619
+ "_model_module": "@jupyter-widgets/controls",
620
+ "_model_module_version": "1.5.0",
621
+ "_model_name": "ProgressStyleModel",
622
+ "_view_count": null,
623
+ "_view_module": "@jupyter-widgets/base",
624
+ "_view_module_version": "1.2.0",
625
+ "_view_name": "StyleView",
626
+ "bar_color": null,
627
+ "description_width": ""
628
+ }
629
+ },
630
+ "ce365fd9ffca4e399f43306afd1d82ec": {
631
+ "model_module": "@jupyter-widgets/base",
632
+ "model_module_version": "1.2.0",
633
+ "model_name": "LayoutModel",
634
+ "state": {
635
+ "_model_module": "@jupyter-widgets/base",
636
+ "_model_module_version": "1.2.0",
637
+ "_model_name": "LayoutModel",
638
+ "_view_count": null,
639
+ "_view_module": "@jupyter-widgets/base",
640
+ "_view_module_version": "1.2.0",
641
+ "_view_name": "LayoutView",
642
+ "align_content": null,
643
+ "align_items": null,
644
+ "align_self": null,
645
+ "border": null,
646
+ "bottom": null,
647
+ "display": null,
648
+ "flex": null,
649
+ "flex_flow": null,
650
+ "grid_area": null,
651
+ "grid_auto_columns": null,
652
+ "grid_auto_flow": null,
653
+ "grid_auto_rows": null,
654
+ "grid_column": null,
655
+ "grid_gap": null,
656
+ "grid_row": null,
657
+ "grid_template_areas": null,
658
+ "grid_template_columns": null,
659
+ "grid_template_rows": null,
660
+ "height": null,
661
+ "justify_content": null,
662
+ "justify_items": null,
663
+ "left": null,
664
+ "margin": null,
665
+ "max_height": null,
666
+ "max_width": null,
667
+ "min_height": null,
668
+ "min_width": null,
669
+ "object_fit": null,
670
+ "object_position": null,
671
+ "order": null,
672
+ "overflow": null,
673
+ "overflow_x": null,
674
+ "overflow_y": null,
675
+ "padding": null,
676
+ "right": null,
677
+ "top": null,
678
+ "visibility": null,
679
+ "width": null
680
+ }
681
+ },
682
+ "cfeb53d0e1d54b0cb4c1faeecaa0782d": {
683
+ "model_module": "@jupyter-widgets/base",
684
+ "model_module_version": "1.2.0",
685
+ "model_name": "LayoutModel",
686
+ "state": {
687
+ "_model_module": "@jupyter-widgets/base",
688
+ "_model_module_version": "1.2.0",
689
+ "_model_name": "LayoutModel",
690
+ "_view_count": null,
691
+ "_view_module": "@jupyter-widgets/base",
692
+ "_view_module_version": "1.2.0",
693
+ "_view_name": "LayoutView",
694
+ "align_content": null,
695
+ "align_items": null,
696
+ "align_self": null,
697
+ "border": null,
698
+ "bottom": null,
699
+ "display": null,
700
+ "flex": null,
701
+ "flex_flow": null,
702
+ "grid_area": null,
703
+ "grid_auto_columns": null,
704
+ "grid_auto_flow": null,
705
+ "grid_auto_rows": null,
706
+ "grid_column": null,
707
+ "grid_gap": null,
708
+ "grid_row": null,
709
+ "grid_template_areas": null,
710
+ "grid_template_columns": null,
711
+ "grid_template_rows": null,
712
+ "height": null,
713
+ "justify_content": null,
714
+ "justify_items": null,
715
+ "left": null,
716
+ "margin": null,
717
+ "max_height": null,
718
+ "max_width": null,
719
+ "min_height": null,
720
+ "min_width": null,
721
+ "object_fit": null,
722
+ "object_position": null,
723
+ "order": null,
724
+ "overflow": null,
725
+ "overflow_x": null,
726
+ "overflow_y": null,
727
+ "padding": null,
728
+ "right": null,
729
+ "top": null,
730
+ "visibility": null,
731
+ "width": null
732
+ }
733
+ },
734
+ "d9d454d5308a46c491787ca33faccb33": {
735
+ "model_module": "@jupyter-widgets/controls",
736
+ "model_module_version": "1.5.0",
737
+ "model_name": "HTMLModel",
738
+ "state": {
739
+ "_dom_classes": [],
740
+ "_model_module": "@jupyter-widgets/controls",
741
+ "_model_module_version": "1.5.0",
742
+ "_model_name": "HTMLModel",
743
+ "_view_count": null,
744
+ "_view_module": "@jupyter-widgets/controls",
745
+ "_view_module_version": "1.5.0",
746
+ "_view_name": "HTMLView",
747
+ "description": "",
748
+ "description_tooltip": null,
749
+ "layout": "IPY_MODEL_e636986344034e2a9a6e03245aa521cc",
750
+ "placeholder": "​",
751
+ "style": "IPY_MODEL_b4eefbed9af540289bc790d9d699a54f",
752
+ "value": ""
753
+ }
754
+ },
755
+ "e4706baef659472aaa63e3d2588eb25c": {
756
+ "model_module": "@jupyter-widgets/base",
757
+ "model_module_version": "1.2.0",
758
+ "model_name": "LayoutModel",
759
+ "state": {
760
+ "_model_module": "@jupyter-widgets/base",
761
+ "_model_module_version": "1.2.0",
762
+ "_model_name": "LayoutModel",
763
+ "_view_count": null,
764
+ "_view_module": "@jupyter-widgets/base",
765
+ "_view_module_version": "1.2.0",
766
+ "_view_name": "LayoutView",
767
+ "align_content": null,
768
+ "align_items": null,
769
+ "align_self": null,
770
+ "border": null,
771
+ "bottom": null,
772
+ "display": null,
773
+ "flex": null,
774
+ "flex_flow": null,
775
+ "grid_area": null,
776
+ "grid_auto_columns": null,
777
+ "grid_auto_flow": null,
778
+ "grid_auto_rows": null,
779
+ "grid_column": null,
780
+ "grid_gap": null,
781
+ "grid_row": null,
782
+ "grid_template_areas": null,
783
+ "grid_template_columns": null,
784
+ "grid_template_rows": null,
785
+ "height": null,
786
+ "justify_content": null,
787
+ "justify_items": null,
788
+ "left": null,
789
+ "margin": null,
790
+ "max_height": null,
791
+ "max_width": null,
792
+ "min_height": null,
793
+ "min_width": null,
794
+ "object_fit": null,
795
+ "object_position": null,
796
+ "order": null,
797
+ "overflow": null,
798
+ "overflow_x": null,
799
+ "overflow_y": null,
800
+ "padding": null,
801
+ "right": null,
802
+ "top": null,
803
+ "visibility": null,
804
+ "width": null
805
+ }
806
+ },
807
+ "e636986344034e2a9a6e03245aa521cc": {
808
+ "model_module": "@jupyter-widgets/base",
809
+ "model_module_version": "1.2.0",
810
+ "model_name": "LayoutModel",
811
+ "state": {
812
+ "_model_module": "@jupyter-widgets/base",
813
+ "_model_module_version": "1.2.0",
814
+ "_model_name": "LayoutModel",
815
+ "_view_count": null,
816
+ "_view_module": "@jupyter-widgets/base",
817
+ "_view_module_version": "1.2.0",
818
+ "_view_name": "LayoutView",
819
+ "align_content": null,
820
+ "align_items": null,
821
+ "align_self": null,
822
+ "border": null,
823
+ "bottom": null,
824
+ "display": null,
825
+ "flex": null,
826
+ "flex_flow": null,
827
+ "grid_area": null,
828
+ "grid_auto_columns": null,
829
+ "grid_auto_flow": null,
830
+ "grid_auto_rows": null,
831
+ "grid_column": null,
832
+ "grid_gap": null,
833
+ "grid_row": null,
834
+ "grid_template_areas": null,
835
+ "grid_template_columns": null,
836
+ "grid_template_rows": null,
837
+ "height": null,
838
+ "justify_content": null,
839
+ "justify_items": null,
840
+ "left": null,
841
+ "margin": null,
842
+ "max_height": null,
843
+ "max_width": null,
844
+ "min_height": null,
845
+ "min_width": null,
846
+ "object_fit": null,
847
+ "object_position": null,
848
+ "order": null,
849
+ "overflow": null,
850
+ "overflow_x": null,
851
+ "overflow_y": null,
852
+ "padding": null,
853
+ "right": null,
854
+ "top": null,
855
+ "visibility": null,
856
+ "width": null
857
+ }
858
+ }
859
+ },
860
+ "version_major": 2,
861
+ "version_minor": 0
862
+ }
863
+ }
864
+ },
865
+ "nbformat": 4,
866
+ "nbformat_minor": 5
867
+ }