Upload osiria_deberta_italian_qa_evaluation.ipynb
Browse files
osiria_deberta_italian_qa_evaluation.ipynb
CHANGED
@@ -34,7 +34,7 @@
|
|
34 |
"base_uri": "https://localhost:8080/"
|
35 |
},
|
36 |
"id": "02K9xO6Gvto1",
|
37 |
-
"outputId": "
|
38 |
},
|
39 |
"outputs": [
|
40 |
{
|
@@ -43,16 +43,16 @@
|
|
43 |
"text": [
|
44 |
"Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
|
45 |
"Collecting git+https://github.com/huggingface/transformers\n",
|
46 |
-
" Cloning https://github.com/huggingface/transformers to /tmp/pip-req-build-
|
47 |
-
" Running command git clone --filter=blob:none --quiet https://github.com/huggingface/transformers /tmp/pip-req-build-
|
48 |
-
" Resolved https://github.com/huggingface/transformers to commit
|
49 |
" Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n",
|
50 |
" Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n",
|
51 |
" Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
|
52 |
"Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (3.12.0)\n",
|
53 |
"Collecting huggingface-hub<1.0,>=0.14.1 (from transformers==4.30.0.dev0)\n",
|
54 |
" Downloading huggingface_hub-0.15.1-py3-none-any.whl (236 kB)\n",
|
55 |
-
"\u001b[2K \u001b[90m
|
56 |
"\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (1.22.4)\n",
|
57 |
"Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (23.1)\n",
|
58 |
"Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (6.0)\n",
|
@@ -60,10 +60,10 @@
|
|
60 |
"Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (2.27.1)\n",
|
61 |
"Collecting tokenizers!=0.11.3,<0.14,>=0.11.1 (from transformers==4.30.0.dev0)\n",
|
62 |
" Downloading tokenizers-0.13.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.8 MB)\n",
|
63 |
-
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.8/7.8 MB\u001b[0m \u001b[
|
64 |
"\u001b[?25hCollecting safetensors>=0.3.1 (from transformers==4.30.0.dev0)\n",
|
65 |
" Downloading safetensors-0.3.1-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.3 MB)\n",
|
66 |
-
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[
|
67 |
"\u001b[?25hRequirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (4.65.0)\n",
|
68 |
"Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.14.1->transformers==4.30.0.dev0) (2023.4.0)\n",
|
69 |
"Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.14.1->transformers==4.30.0.dev0) (4.5.0)\n",
|
@@ -73,8 +73,8 @@
|
|
73 |
"Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.30.0.dev0) (3.4)\n",
|
74 |
"Building wheels for collected packages: transformers\n",
|
75 |
" Building wheel for transformers (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
|
76 |
-
" Created wheel for transformers: filename=transformers-4.30.0.dev0-py3-none-any.whl size=
|
77 |
-
" Stored in directory: /tmp/pip-ephem-wheel-cache-
|
78 |
"Successfully built transformers\n",
|
79 |
"Installing collected packages: tokenizers, safetensors, huggingface-hub, transformers\n",
|
80 |
"Successfully installed huggingface-hub-0.15.1 safetensors-0.3.1 tokenizers-0.13.3 transformers-4.30.0.dev0\n"
|
@@ -95,7 +95,7 @@
|
|
95 |
"base_uri": "https://localhost:8080/"
|
96 |
},
|
97 |
"id": "VKgybrUswa1q",
|
98 |
-
"outputId": "
|
99 |
},
|
100 |
"execution_count": 2,
|
101 |
"outputs": [
|
@@ -106,25 +106,25 @@
|
|
106 |
"Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
|
107 |
"Collecting datasets\n",
|
108 |
" Downloading datasets-2.12.0-py3-none-any.whl (474 kB)\n",
|
109 |
-
"\u001b[2K \u001b[90m
|
110 |
"\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from datasets) (1.22.4)\n",
|
111 |
"Requirement already satisfied: pyarrow>=8.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (9.0.0)\n",
|
112 |
"Collecting dill<0.3.7,>=0.3.0 (from datasets)\n",
|
113 |
" Downloading dill-0.3.6-py3-none-any.whl (110 kB)\n",
|
114 |
-
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m110.5/110.5 kB\u001b[0m \u001b[31m14.
|
115 |
"\u001b[?25hRequirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from datasets) (1.5.3)\n",
|
116 |
"Requirement already satisfied: requests>=2.19.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (2.27.1)\n",
|
117 |
"Requirement already satisfied: tqdm>=4.62.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (4.65.0)\n",
|
118 |
"Collecting xxhash (from datasets)\n",
|
119 |
" Downloading xxhash-3.2.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (212 kB)\n",
|
120 |
-
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m212.5/212.5 kB\u001b[0m \u001b[
|
121 |
"\u001b[?25hCollecting multiprocess (from datasets)\n",
|
122 |
" Downloading multiprocess-0.70.14-py310-none-any.whl (134 kB)\n",
|
123 |
-
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.3/134.3 kB\u001b[0m \u001b[
|
124 |
"\u001b[?25hRequirement already satisfied: fsspec[http]>=2021.11.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (2023.4.0)\n",
|
125 |
"Collecting aiohttp (from datasets)\n",
|
126 |
" Downloading aiohttp-3.8.4-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.0 MB)\n",
|
127 |
-
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.0/1.0 MB\u001b[0m \u001b[
|
128 |
"\u001b[?25hRequirement already satisfied: huggingface-hub<1.0.0,>=0.11.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (0.15.1)\n",
|
129 |
"Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from datasets) (23.1)\n",
|
130 |
"Collecting responses<0.19 (from datasets)\n",
|
@@ -134,15 +134,15 @@
|
|
134 |
"Requirement already satisfied: charset-normalizer<4.0,>=2.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (2.0.12)\n",
|
135 |
"Collecting multidict<7.0,>=4.5 (from aiohttp->datasets)\n",
|
136 |
" Downloading multidict-6.0.4-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (114 kB)\n",
|
137 |
-
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m114.5/114.5 kB\u001b[0m \u001b[
|
138 |
"\u001b[?25hCollecting async-timeout<5.0,>=4.0.0a3 (from aiohttp->datasets)\n",
|
139 |
" Downloading async_timeout-4.0.2-py3-none-any.whl (5.8 kB)\n",
|
140 |
"Collecting yarl<2.0,>=1.0 (from aiohttp->datasets)\n",
|
141 |
" Downloading yarl-1.9.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (268 kB)\n",
|
142 |
-
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m268.8/268.8 kB\u001b[0m \u001b[
|
143 |
"\u001b[?25hCollecting frozenlist>=1.1.1 (from aiohttp->datasets)\n",
|
144 |
" Downloading frozenlist-1.3.3-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (149 kB)\n",
|
145 |
-
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m149.6/149.6 kB\u001b[0m \u001b[
|
146 |
"\u001b[?25hCollecting aiosignal>=1.1.2 (from aiohttp->datasets)\n",
|
147 |
" Downloading aiosignal-1.3.1-py3-none-any.whl (7.6 kB)\n",
|
148 |
"Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0.0,>=0.11.0->datasets) (3.12.0)\n",
|
@@ -169,7 +169,7 @@
|
|
169 |
"base_uri": "https://localhost:8080/"
|
170 |
},
|
171 |
"id": "xYEW0Hjqz2lo",
|
172 |
-
"outputId": "
|
173 |
},
|
174 |
"execution_count": 3,
|
175 |
"outputs": [
|
@@ -179,8 +179,8 @@
|
|
179 |
"text": [
|
180 |
"Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
|
181 |
"Collecting accelerate\n",
|
182 |
-
" Downloading accelerate-0.
|
183 |
-
"\u001b[2K \u001b[90m
|
184 |
"\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from accelerate) (1.22.4)\n",
|
185 |
"Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from accelerate) (23.1)\n",
|
186 |
"Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate) (5.9.5)\n",
|
@@ -197,7 +197,7 @@
|
|
197 |
"Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch>=1.6.0->accelerate) (2.1.2)\n",
|
198 |
"Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch>=1.6.0->accelerate) (1.3.0)\n",
|
199 |
"Installing collected packages: accelerate\n",
|
200 |
-
"Successfully installed accelerate-0.
|
201 |
]
|
202 |
}
|
203 |
]
|
@@ -212,7 +212,7 @@
|
|
212 |
"base_uri": "https://localhost:8080/"
|
213 |
},
|
214 |
"id": "9OFz3JdR0cQ_",
|
215 |
-
"outputId": "
|
216 |
},
|
217 |
"execution_count": 4,
|
218 |
"outputs": [
|
@@ -223,7 +223,7 @@
|
|
223 |
"Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
|
224 |
"Collecting evaluate\n",
|
225 |
" Downloading evaluate-0.4.0-py3-none-any.whl (81 kB)\n",
|
226 |
-
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m81.4/81.4 kB\u001b[0m \u001b[
|
227 |
"\u001b[?25hRequirement already satisfied: datasets>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from evaluate) (2.12.0)\n",
|
228 |
"Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from evaluate) (1.22.4)\n",
|
229 |
"Requirement already satisfied: dill in /usr/local/lib/python3.10/dist-packages (from evaluate) (0.3.6)\n",
|
@@ -272,7 +272,7 @@
|
|
272 |
"base_uri": "https://localhost:8080/"
|
273 |
},
|
274 |
"id": "JJhpBNwpxOTK",
|
275 |
-
"outputId": "
|
276 |
},
|
277 |
"execution_count": 5,
|
278 |
"outputs": [
|
@@ -280,18 +280,18 @@
|
|
280 |
"output_type": "stream",
|
281 |
"name": "stdout",
|
282 |
"text": [
|
283 |
-
"--2023-06-
|
284 |
"Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 185.199.108.133, 185.199.109.133, 185.199.110.133, ...\n",
|
285 |
"Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|185.199.108.133|:443... connected.\n",
|
286 |
"HTTP request sent, awaiting response... 200 OK\n",
|
287 |
"Length: 31717 (31K) [text/plain]\n",
|
288 |
"Saving to: ‘run_qa.py’\n",
|
289 |
"\n",
|
290 |
-
"run_qa.py 100%[===================>] 30.97K --.-KB/s in
|
291 |
"\n",
|
292 |
-
"2023-06-
|
293 |
"\n",
|
294 |
-
"--2023-06-
|
295 |
"Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 185.199.108.133, 185.199.109.133, 185.199.110.133, ...\n",
|
296 |
"Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|185.199.108.133|:443... connected.\n",
|
297 |
"HTTP request sent, awaiting response... 200 OK\n",
|
@@ -300,18 +300,18 @@
|
|
300 |
"\n",
|
301 |
"trainer_qa.py 100%[===================>] 6.11K --.-KB/s in 0s \n",
|
302 |
"\n",
|
303 |
-
"2023-06-
|
304 |
"\n",
|
305 |
-
"--2023-06-
|
306 |
-
"Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 185.199.
|
307 |
-
"Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|185.199.
|
308 |
"HTTP request sent, awaiting response... 200 OK\n",
|
309 |
"Length: 22777 (22K) [text/plain]\n",
|
310 |
"Saving to: ‘utils_qa.py’\n",
|
311 |
"\n",
|
312 |
-
"utils_qa.py 100%[===================>] 22.24K --.-KB/s in
|
313 |
"\n",
|
314 |
-
"2023-06-
|
315 |
"\n"
|
316 |
]
|
317 |
}
|
@@ -327,7 +327,7 @@
|
|
327 |
"base_uri": "https://localhost:8080/"
|
328 |
},
|
329 |
"id": "Loa6y9XqzXJ4",
|
330 |
-
"outputId": "
|
331 |
},
|
332 |
"execution_count": 6,
|
333 |
"outputs": [
|
@@ -361,7 +361,7 @@
|
|
361 |
"base_uri": "https://localhost:8080/"
|
362 |
},
|
363 |
"id": "B5O5Lom8x_c4",
|
364 |
-
"outputId": "
|
365 |
},
|
366 |
"execution_count": 8,
|
367 |
"outputs": [
|
@@ -369,9 +369,9 @@
|
|
369 |
"output_type": "stream",
|
370 |
"name": "stdout",
|
371 |
"text": [
|
372 |
-
"2023-06-
|
373 |
-
"06/
|
374 |
-
"06/
|
375 |
"_n_gpu=1,\n",
|
376 |
"adafactor=False,\n",
|
377 |
"adam_beta1=0.9,\n",
|
@@ -428,7 +428,7 @@
|
|
428 |
"log_level=passive,\n",
|
429 |
"log_level_replica=warning,\n",
|
430 |
"log_on_each_node=True,\n",
|
431 |
-
"logging_dir=eval_results/runs/
|
432 |
"logging_first_step=False,\n",
|
433 |
"logging_nan_inf_filter=True,\n",
|
434 |
"logging_steps=500,\n",
|
@@ -480,45 +480,46 @@
|
|
480 |
"weight_decay=0.0,\n",
|
481 |
"xpu_backend=None,\n",
|
482 |
")\n",
|
483 |
-
"06/
|
484 |
-
"Downloading builder script: 100% 4.74k/4.74k [00:00<00:00,
|
485 |
-
"06/
|
486 |
-
"06/
|
487 |
-
"06/
|
488 |
-
"Downloading metadata: 100% 2.51k/2.51k [00:00<00:00, 2.
|
489 |
-
"06/
|
490 |
-
"06/
|
491 |
-
"06/
|
492 |
-
"Downloading readme: 100% 7.27k/7.27k [00:00<00:00,
|
493 |
-
"06/
|
494 |
-
"06/
|
495 |
-
"06/
|
496 |
-
"06/
|
497 |
"Downloading and preparing dataset squad_it/default to /root/.cache/huggingface/datasets/squad_it/default/0.1.0/d442bdb4794b4bae227ab19105b76d706ed7cf2ac342e4c9da4a5c36bde19d71...\n",
|
498 |
-
"06/
|
499 |
-
"Downloading data files: 0% 0/2 [00:00<?, ?it/s]06/
|
500 |
"\n",
|
501 |
"Downloading data: 0% 0.00/7.73M [00:00<?, ?B/s]\u001b[A\n",
|
502 |
-
"Downloading data: 100% 7.73M/7.73M [00:00<00:00,
|
503 |
-
"06/
|
504 |
-
"06/
|
505 |
-
"Downloading data files: 50% 1/2 [00:
|
506 |
"\n",
|
507 |
-
"Downloading data:
|
508 |
-
"
|
509 |
-
"06/
|
510 |
-
"
|
511 |
-
"
|
512 |
-
"06/
|
513 |
-
"
|
514 |
-
"
|
515 |
-
"06/
|
516 |
-
"06/
|
|
|
517 |
"Dataset squad_it downloaded and prepared to /root/.cache/huggingface/datasets/squad_it/default/0.1.0/d442bdb4794b4bae227ab19105b76d706ed7cf2ac342e4c9da4a5c36bde19d71. Subsequent calls will reuse this data.\n",
|
518 |
-
"100% 2/2 [00:00<00:00,
|
519 |
-
"Downloading (…)lve/main/config.json: 100% 826/826 [00:00<00:00,
|
520 |
-
"[INFO|configuration_utils.py:669] 2023-06-
|
521 |
-
"[INFO|configuration_utils.py:725] 2023-06-
|
522 |
" \"_name_or_path\": \"osiria/deberta-italian-question-answering\",\n",
|
523 |
" \"architectures\": [\n",
|
524 |
" \"DebertaV2ForQuestionAnswering\"\n",
|
@@ -554,325 +555,300 @@
|
|
554 |
" \"vocab_size\": 50256\n",
|
555 |
"}\n",
|
556 |
"\n",
|
557 |
-
"Downloading (…)okenizer_config.json: 100% 412/412 [00:00<00:00, 2.
|
558 |
-
"Downloading (…)/main/tokenizer.json: 100% 2.02M/2.02M [00:
|
559 |
-
"[INFO|tokenization_utils_base.py:
|
560 |
-
"[INFO|tokenization_utils_base.py:
|
561 |
-
"[INFO|tokenization_utils_base.py:
|
562 |
-
"[INFO|tokenization_utils_base.py:
|
563 |
-
"[INFO|tokenization_utils_base.py:
|
564 |
-
"Downloading pytorch_model.bin: 100% 496M/496M [00:
|
565 |
-
"[INFO|modeling_utils.py:
|
566 |
-
"[INFO|modeling_utils.py:
|
567 |
"\n",
|
568 |
-
"[INFO|modeling_utils.py:
|
569 |
"If your task is similar to the task the model of the checkpoint was trained on, you can already use DebertaV2ForQuestionAnswering for predictions without further training.\n",
|
570 |
-
"Running tokenizer on prediction dataset: 0% 0/7609 [00:00<?, ? examples/s]06/
|
571 |
-
"Downloading builder script: 100% 4.53k/4.53k [00:00<00:00,
|
572 |
-
"Downloading extra modules: 100% 3.32k/3.32k [00:00<00:00, 3.
|
573 |
-
"06/
|
574 |
-
"[INFO|trainer.py:
|
575 |
-
"[INFO|trainer.py:
|
576 |
-
"[INFO|trainer.py:
|
577 |
-
"[INFO|trainer.py:
|
578 |
-
"100% 1713/1713 [04:
|
579 |
"\n",
|
580 |
" 0% 0/7609 [00:00<?, ?it/s]\u001b[A\n",
|
581 |
-
" 0%
|
582 |
-
"
|
583 |
-
" 1%
|
584 |
-
"
|
585 |
-
"
|
586 |
-
"
|
587 |
-
"
|
588 |
-
"
|
589 |
-
"
|
590 |
-
"
|
591 |
-
"
|
592 |
-
"
|
593 |
-
"
|
594 |
-
"
|
595 |
-
"
|
596 |
-
"
|
597 |
-
"
|
598 |
-
"
|
599 |
-
"
|
600 |
-
"
|
601 |
-
"
|
602 |
-
"
|
603 |
-
"
|
604 |
-
"
|
605 |
-
"
|
606 |
-
"
|
607 |
-
"
|
608 |
-
"
|
609 |
-
"
|
610 |
-
"
|
611 |
-
"
|
612 |
-
"
|
613 |
-
"
|
614 |
-
"
|
615 |
-
"
|
616 |
-
"
|
617 |
-
"
|
618 |
-
"
|
619 |
-
"
|
620 |
-
"
|
621 |
-
"
|
622 |
-
"
|
623 |
-
"
|
624 |
-
"
|
625 |
-
"
|
626 |
-
"
|
627 |
-
"
|
628 |
-
"
|
629 |
-
"
|
630 |
-
"
|
631 |
-
"
|
632 |
-
"
|
633 |
-
"
|
634 |
-
"
|
635 |
-
"
|
636 |
-
"
|
637 |
-
"
|
638 |
-
"
|
639 |
-
"
|
640 |
-
"
|
641 |
-
"
|
642 |
-
"
|
643 |
-
"
|
644 |
-
"
|
645 |
-
"
|
646 |
-
"
|
647 |
-
"
|
648 |
-
"
|
649 |
-
"
|
650 |
-
"
|
651 |
-
"
|
652 |
-
"
|
653 |
-
"
|
654 |
-
"
|
655 |
-
"
|
656 |
-
"
|
657 |
-
"
|
658 |
-
"
|
659 |
-
" 28%
|
660 |
-
"
|
661 |
-
" 29%
|
662 |
-
" 29%
|
663 |
-
"
|
664 |
-
"
|
665 |
-
" 30%
|
666 |
-
"
|
667 |
-
" 31%
|
668 |
-
"
|
669 |
-
"
|
670 |
-
"
|
671 |
-
"
|
672 |
-
" 33%
|
673 |
-
"
|
674 |
-
" 34%
|
675 |
-
"
|
676 |
-
"
|
677 |
-
" 35%
|
678 |
-
"
|
679 |
-
" 36%
|
680 |
-
"
|
681 |
-
"
|
682 |
-
"
|
683 |
-
"
|
684 |
-
" 38%
|
685 |
-
"
|
686 |
-
"
|
687 |
-
"
|
688 |
-
"
|
689 |
-
"
|
690 |
-
"
|
691 |
-
"
|
692 |
-
"
|
693 |
-
"
|
694 |
-
"
|
695 |
-
"
|
696 |
-
"
|
697 |
-
"
|
698 |
-
"
|
699 |
-
"
|
700 |
-
"
|
701 |
-
"
|
702 |
-
"
|
703 |
-
"
|
704 |
-
"
|
705 |
-
"
|
706 |
-
"
|
707 |
-
"
|
708 |
-
"
|
709 |
-
"
|
710 |
-
"
|
711 |
-
"
|
712 |
-
"
|
713 |
-
"
|
714 |
-
"
|
715 |
-
"
|
716 |
-
"
|
717 |
-
"
|
718 |
-
"
|
719 |
-
"
|
720 |
-
"
|
721 |
-
"
|
722 |
-
"
|
723 |
-
"
|
724 |
-
"
|
725 |
-
"
|
726 |
-
"
|
727 |
-
"
|
728 |
-
"
|
729 |
-
"
|
730 |
-
"
|
731 |
-
"
|
732 |
-
"
|
733 |
-
"
|
734 |
-
"
|
735 |
-
"
|
736 |
-
"
|
737 |
-
"
|
738 |
-
"
|
739 |
-
"
|
740 |
-
"
|
741 |
-
"
|
742 |
-
"
|
743 |
-
"
|
744 |
-
"
|
745 |
-
"
|
746 |
-
"
|
747 |
-
"
|
748 |
-
"
|
749 |
-
"
|
750 |
-
"
|
751 |
-
"
|
752 |
-
"
|
753 |
-
"
|
754 |
-
"
|
755 |
-
"
|
756 |
-
"
|
757 |
-
"
|
758 |
-
"
|
759 |
-
"
|
760 |
-
"
|
761 |
-
"
|
762 |
-
"
|
763 |
-
"
|
764 |
-
"
|
765 |
-
"
|
766 |
-
"
|
767 |
-
"
|
768 |
-
"
|
769 |
-
"
|
770 |
-
"
|
771 |
-
"
|
772 |
-
"
|
773 |
-
"
|
774 |
-
"
|
775 |
-
"
|
776 |
-
"
|
777 |
-
"
|
778 |
-
"
|
779 |
-
"
|
780 |
-
"
|
781 |
-
"
|
782 |
-
"
|
783 |
-
"
|
784 |
-
"
|
785 |
-
"
|
786 |
-
"
|
787 |
-
"
|
788 |
-
"
|
789 |
-
"
|
790 |
-
"
|
791 |
-
"
|
792 |
-
"
|
793 |
-
"
|
794 |
-
"
|
795 |
-
"
|
796 |
-
"
|
797 |
-
"
|
798 |
-
"
|
799 |
-
"
|
800 |
-
"
|
801 |
-
"
|
802 |
-
"
|
803 |
-
"
|
804 |
-
"
|
805 |
-
"
|
806 |
-
"
|
807 |
-
"
|
808 |
-
"
|
809 |
-
"
|
810 |
-
"
|
811 |
-
"
|
812 |
-
"
|
813 |
-
"
|
814 |
-
"
|
815 |
-
"
|
816 |
-
"
|
817 |
-
"
|
818 |
-
"
|
819 |
-
"
|
820 |
-
"
|
821 |
-
"
|
822 |
-
"
|
823 |
-
"
|
824 |
-
"
|
825 |
-
"
|
826 |
-
"
|
827 |
-
"
|
828 |
-
"
|
829 |
-
"
|
830 |
-
"
|
831 |
-
"
|
832 |
-
"
|
833 |
-
"
|
834 |
-
"
|
835 |
-
"
|
836 |
-
"
|
837 |
-
"
|
838 |
-
"
|
839 |
-
"
|
840 |
-
"
|
841 |
-
" 93% 7104/7609 [00:29<00:03, 134.23it/s]\u001b[A\n",
|
842 |
-
" 94% 7118/7609 [00:29<00:03, 132.23it/s]\u001b[A\n",
|
843 |
-
" 94% 7136/7609 [00:29<00:03, 142.38it/s]\u001b[A\n",
|
844 |
-
" 94% 7151/7609 [00:29<00:03, 140.73it/s]\u001b[A\n",
|
845 |
-
" 94% 7167/7609 [00:29<00:03, 145.65it/s]\u001b[A\n",
|
846 |
-
" 94% 7186/7609 [00:29<00:02, 156.49it/s]\u001b[A\n",
|
847 |
-
" 95% 7202/7609 [00:29<00:02, 142.59it/s]\u001b[A\n",
|
848 |
-
" 95% 7222/7609 [00:29<00:02, 155.98it/s]\u001b[A\n",
|
849 |
-
" 95% 7241/7609 [00:30<00:02, 163.57it/s]\u001b[A\n",
|
850 |
-
" 95% 7258/7609 [00:30<00:02, 163.20it/s]\u001b[A\n",
|
851 |
-
" 96% 7276/7609 [00:30<00:01, 167.01it/s]\u001b[A\n",
|
852 |
-
" 96% 7296/7609 [00:30<00:01, 175.67it/s]\u001b[A\n",
|
853 |
-
" 96% 7317/7609 [00:30<00:01, 183.09it/s]\u001b[A\n",
|
854 |
-
" 97% 7345/7609 [00:30<00:01, 210.09it/s]\u001b[A\n",
|
855 |
-
" 97% 7377/7609 [00:30<00:00, 242.02it/s]\u001b[A\n",
|
856 |
-
" 97% 7407/7609 [00:30<00:00, 252.08it/s]\u001b[A\n",
|
857 |
-
" 98% 7434/7609 [00:30<00:00, 256.70it/s]\u001b[A\n",
|
858 |
-
" 98% 7460/7609 [00:30<00:00, 248.40it/s]\u001b[A\n",
|
859 |
-
" 98% 7488/7609 [00:31<00:00, 252.82it/s]\u001b[A\n",
|
860 |
-
" 99% 7514/7609 [00:31<00:00, 248.94it/s]\u001b[A\n",
|
861 |
-
" 99% 7539/7609 [00:31<00:00, 231.82it/s]\u001b[A\n",
|
862 |
-
" 99% 7563/7609 [00:31<00:00, 218.37it/s]\u001b[A\n",
|
863 |
-
"100% 7609/7609 [00:31<00:00, 240.54it/s]\n",
|
864 |
-
"06/01/2023 22:22:13 - INFO - utils_qa - Saving predictions to eval_results/predict_predictions.json.\n",
|
865 |
-
"06/01/2023 22:22:13 - INFO - utils_qa - Saving nbest_preds to eval_results/predict_nbest_predictions.json.\n",
|
866 |
"***** predict metrics *****\n",
|
867 |
" predict_samples = 8565\n",
|
868 |
-
" test_exact_match =
|
869 |
-
" test_f1 = 80.
|
870 |
-
" test_runtime = 0:04:
|
871 |
-
" test_samples_per_second = 29.
|
872 |
-
" test_steps_per_second = 5.
|
873 |
-
"[INFO|modelcard.py:451] 2023-06-
|
874 |
"{'task': {'name': 'Question Answering', 'type': 'question-answering'}, 'dataset': {'name': 'squad_it', 'type': 'squad_it'}}\n",
|
875 |
-
"100% 1713/1713 [05:
|
876 |
]
|
877 |
}
|
878 |
]
|
|
|
34 |
"base_uri": "https://localhost:8080/"
|
35 |
},
|
36 |
"id": "02K9xO6Gvto1",
|
37 |
+
"outputId": "10556608-a497-4c01-e07d-8f95f7ec41ac"
|
38 |
},
|
39 |
"outputs": [
|
40 |
{
|
|
|
43 |
"text": [
|
44 |
"Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
|
45 |
"Collecting git+https://github.com/huggingface/transformers\n",
|
46 |
+
" Cloning https://github.com/huggingface/transformers to /tmp/pip-req-build-wnz73n3o\n",
|
47 |
+
" Running command git clone --filter=blob:none --quiet https://github.com/huggingface/transformers /tmp/pip-req-build-wnz73n3o\n",
|
48 |
+
" Resolved https://github.com/huggingface/transformers to commit 12298cb65c7e9d615b749dde935a0b4966f4ae49\n",
|
49 |
" Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n",
|
50 |
" Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n",
|
51 |
" Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
|
52 |
"Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (3.12.0)\n",
|
53 |
"Collecting huggingface-hub<1.0,>=0.14.1 (from transformers==4.30.0.dev0)\n",
|
54 |
" Downloading huggingface_hub-0.15.1-py3-none-any.whl (236 kB)\n",
|
55 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m236.8/236.8 kB\u001b[0m \u001b[31m3.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
56 |
"\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (1.22.4)\n",
|
57 |
"Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (23.1)\n",
|
58 |
"Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (6.0)\n",
|
|
|
60 |
"Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (2.27.1)\n",
|
61 |
"Collecting tokenizers!=0.11.3,<0.14,>=0.11.1 (from transformers==4.30.0.dev0)\n",
|
62 |
" Downloading tokenizers-0.13.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.8 MB)\n",
|
63 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.8/7.8 MB\u001b[0m \u001b[31m52.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
64 |
"\u001b[?25hCollecting safetensors>=0.3.1 (from transformers==4.30.0.dev0)\n",
|
65 |
" Downloading safetensors-0.3.1-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.3 MB)\n",
|
66 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[31m87.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
67 |
"\u001b[?25hRequirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers==4.30.0.dev0) (4.65.0)\n",
|
68 |
"Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.14.1->transformers==4.30.0.dev0) (2023.4.0)\n",
|
69 |
"Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.14.1->transformers==4.30.0.dev0) (4.5.0)\n",
|
|
|
73 |
"Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.30.0.dev0) (3.4)\n",
|
74 |
"Building wheels for collected packages: transformers\n",
|
75 |
" Building wheel for transformers (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
|
76 |
+
" Created wheel for transformers: filename=transformers-4.30.0.dev0-py3-none-any.whl size=7166227 sha256=fdfdc040a7686aacafeef0a3fbf5d6b894a22a4967949ffa981ee09e9f574aac\n",
|
77 |
+
" Stored in directory: /tmp/pip-ephem-wheel-cache-mynbfxj2/wheels/c0/14/d6/6c9a5582d2ac191ec0a483be151a4495fe1eb2a6706ca49f1b\n",
|
78 |
"Successfully built transformers\n",
|
79 |
"Installing collected packages: tokenizers, safetensors, huggingface-hub, transformers\n",
|
80 |
"Successfully installed huggingface-hub-0.15.1 safetensors-0.3.1 tokenizers-0.13.3 transformers-4.30.0.dev0\n"
|
|
|
95 |
"base_uri": "https://localhost:8080/"
|
96 |
},
|
97 |
"id": "VKgybrUswa1q",
|
98 |
+
"outputId": "7f2ad166-68a2-433c-d0b4-8312192dee9e"
|
99 |
},
|
100 |
"execution_count": 2,
|
101 |
"outputs": [
|
|
|
106 |
"Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
|
107 |
"Collecting datasets\n",
|
108 |
" Downloading datasets-2.12.0-py3-none-any.whl (474 kB)\n",
|
109 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m474.6/474.6 kB\u001b[0m \u001b[31m5.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
110 |
"\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from datasets) (1.22.4)\n",
|
111 |
"Requirement already satisfied: pyarrow>=8.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (9.0.0)\n",
|
112 |
"Collecting dill<0.3.7,>=0.3.0 (from datasets)\n",
|
113 |
" Downloading dill-0.3.6-py3-none-any.whl (110 kB)\n",
|
114 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m110.5/110.5 kB\u001b[0m \u001b[31m14.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
115 |
"\u001b[?25hRequirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from datasets) (1.5.3)\n",
|
116 |
"Requirement already satisfied: requests>=2.19.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (2.27.1)\n",
|
117 |
"Requirement already satisfied: tqdm>=4.62.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (4.65.0)\n",
|
118 |
"Collecting xxhash (from datasets)\n",
|
119 |
" Downloading xxhash-3.2.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (212 kB)\n",
|
120 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m212.5/212.5 kB\u001b[0m \u001b[31m23.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
121 |
"\u001b[?25hCollecting multiprocess (from datasets)\n",
|
122 |
" Downloading multiprocess-0.70.14-py310-none-any.whl (134 kB)\n",
|
123 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.3/134.3 kB\u001b[0m \u001b[31m17.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
124 |
"\u001b[?25hRequirement already satisfied: fsspec[http]>=2021.11.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (2023.4.0)\n",
|
125 |
"Collecting aiohttp (from datasets)\n",
|
126 |
" Downloading aiohttp-3.8.4-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.0 MB)\n",
|
127 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.0/1.0 MB\u001b[0m \u001b[31m24.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
128 |
"\u001b[?25hRequirement already satisfied: huggingface-hub<1.0.0,>=0.11.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (0.15.1)\n",
|
129 |
"Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from datasets) (23.1)\n",
|
130 |
"Collecting responses<0.19 (from datasets)\n",
|
|
|
134 |
"Requirement already satisfied: charset-normalizer<4.0,>=2.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (2.0.12)\n",
|
135 |
"Collecting multidict<7.0,>=4.5 (from aiohttp->datasets)\n",
|
136 |
" Downloading multidict-6.0.4-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (114 kB)\n",
|
137 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m114.5/114.5 kB\u001b[0m \u001b[31m14.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
138 |
"\u001b[?25hCollecting async-timeout<5.0,>=4.0.0a3 (from aiohttp->datasets)\n",
|
139 |
" Downloading async_timeout-4.0.2-py3-none-any.whl (5.8 kB)\n",
|
140 |
"Collecting yarl<2.0,>=1.0 (from aiohttp->datasets)\n",
|
141 |
" Downloading yarl-1.9.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (268 kB)\n",
|
142 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m268.8/268.8 kB\u001b[0m \u001b[31m26.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
143 |
"\u001b[?25hCollecting frozenlist>=1.1.1 (from aiohttp->datasets)\n",
|
144 |
" Downloading frozenlist-1.3.3-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (149 kB)\n",
|
145 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m149.6/149.6 kB\u001b[0m \u001b[31m20.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
146 |
"\u001b[?25hCollecting aiosignal>=1.1.2 (from aiohttp->datasets)\n",
|
147 |
" Downloading aiosignal-1.3.1-py3-none-any.whl (7.6 kB)\n",
|
148 |
"Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0.0,>=0.11.0->datasets) (3.12.0)\n",
|
|
|
169 |
"base_uri": "https://localhost:8080/"
|
170 |
},
|
171 |
"id": "xYEW0Hjqz2lo",
|
172 |
+
"outputId": "773d7aa2-0675-4edf-cb7e-34046a4fba55"
|
173 |
},
|
174 |
"execution_count": 3,
|
175 |
"outputs": [
|
|
|
179 |
"text": [
|
180 |
"Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
|
181 |
"Collecting accelerate\n",
|
182 |
+
" Downloading accelerate-0.20.0-py3-none-any.whl (227 kB)\n",
|
183 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m227.4/227.4 kB\u001b[0m \u001b[31m3.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
184 |
"\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from accelerate) (1.22.4)\n",
|
185 |
"Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from accelerate) (23.1)\n",
|
186 |
"Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate) (5.9.5)\n",
|
|
|
197 |
"Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch>=1.6.0->accelerate) (2.1.2)\n",
|
198 |
"Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch>=1.6.0->accelerate) (1.3.0)\n",
|
199 |
"Installing collected packages: accelerate\n",
|
200 |
+
"Successfully installed accelerate-0.20.0\n"
|
201 |
]
|
202 |
}
|
203 |
]
|
|
|
212 |
"base_uri": "https://localhost:8080/"
|
213 |
},
|
214 |
"id": "9OFz3JdR0cQ_",
|
215 |
+
"outputId": "202b4d5c-8d48-4f01-c760-9bfb413fbb30"
|
216 |
},
|
217 |
"execution_count": 4,
|
218 |
"outputs": [
|
|
|
223 |
"Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
|
224 |
"Collecting evaluate\n",
|
225 |
" Downloading evaluate-0.4.0-py3-none-any.whl (81 kB)\n",
|
226 |
+
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m81.4/81.4 kB\u001b[0m \u001b[31m2.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
|
227 |
"\u001b[?25hRequirement already satisfied: datasets>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from evaluate) (2.12.0)\n",
|
228 |
"Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from evaluate) (1.22.4)\n",
|
229 |
"Requirement already satisfied: dill in /usr/local/lib/python3.10/dist-packages (from evaluate) (0.3.6)\n",
|
|
|
272 |
"base_uri": "https://localhost:8080/"
|
273 |
},
|
274 |
"id": "JJhpBNwpxOTK",
|
275 |
+
"outputId": "bbb60e1c-bde4-49b0-bfb2-eaf01cbcad29"
|
276 |
},
|
277 |
"execution_count": 5,
|
278 |
"outputs": [
|
|
|
280 |
"output_type": "stream",
|
281 |
"name": "stdout",
|
282 |
"text": [
|
283 |
+
"--2023-06-07 16:47:01-- https://raw.githubusercontent.com/huggingface/transformers/main/examples/pytorch/question-answering/run_qa.py\n",
|
284 |
"Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 185.199.108.133, 185.199.109.133, 185.199.110.133, ...\n",
|
285 |
"Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|185.199.108.133|:443... connected.\n",
|
286 |
"HTTP request sent, awaiting response... 200 OK\n",
|
287 |
"Length: 31717 (31K) [text/plain]\n",
|
288 |
"Saving to: ‘run_qa.py’\n",
|
289 |
"\n",
|
290 |
+
"run_qa.py 100%[===================>] 30.97K --.-KB/s in 0.006s \n",
|
291 |
"\n",
|
292 |
+
"2023-06-07 16:47:01 (5.21 MB/s) - ‘run_qa.py’ saved [31717/31717]\n",
|
293 |
"\n",
|
294 |
+
"--2023-06-07 16:47:02-- https://raw.githubusercontent.com/huggingface/transformers/main/examples/pytorch/question-answering/trainer_qa.py\n",
|
295 |
"Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 185.199.108.133, 185.199.109.133, 185.199.110.133, ...\n",
|
296 |
"Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|185.199.108.133|:443... connected.\n",
|
297 |
"HTTP request sent, awaiting response... 200 OK\n",
|
|
|
300 |
"\n",
|
301 |
"trainer_qa.py 100%[===================>] 6.11K --.-KB/s in 0s \n",
|
302 |
"\n",
|
303 |
+
"2023-06-07 16:47:02 (87.1 MB/s) - ‘trainer_qa.py’ saved [6253/6253]\n",
|
304 |
"\n",
|
305 |
+
"--2023-06-07 16:47:02-- https://raw.githubusercontent.com/huggingface/transformers/main/examples/pytorch/question-answering/utils_qa.py\n",
|
306 |
+
"Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 185.199.110.133, 185.199.109.133, 185.199.111.133, ...\n",
|
307 |
+
"Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|185.199.110.133|:443... connected.\n",
|
308 |
"HTTP request sent, awaiting response... 200 OK\n",
|
309 |
"Length: 22777 (22K) [text/plain]\n",
|
310 |
"Saving to: ‘utils_qa.py’\n",
|
311 |
"\n",
|
312 |
+
"utils_qa.py 100%[===================>] 22.24K --.-KB/s in 0.004s \n",
|
313 |
"\n",
|
314 |
+
"2023-06-07 16:47:02 (4.95 MB/s) - ‘utils_qa.py’ saved [22777/22777]\n",
|
315 |
"\n"
|
316 |
]
|
317 |
}
|
|
|
327 |
"base_uri": "https://localhost:8080/"
|
328 |
},
|
329 |
"id": "Loa6y9XqzXJ4",
|
330 |
+
"outputId": "3be368ce-5d9e-4df2-c3c9-f6a5a537c405"
|
331 |
},
|
332 |
"execution_count": 6,
|
333 |
"outputs": [
|
|
|
361 |
"base_uri": "https://localhost:8080/"
|
362 |
},
|
363 |
"id": "B5O5Lom8x_c4",
|
364 |
+
"outputId": "ebb24d93-3e0c-4eae-ca30-28d1c9a46bc6"
|
365 |
},
|
366 |
"execution_count": 8,
|
367 |
"outputs": [
|
|
|
369 |
"output_type": "stream",
|
370 |
"name": "stdout",
|
371 |
"text": [
|
372 |
+
"2023-06-07 16:47:10.607285: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
|
373 |
+
"06/07/2023 16:47:13 - WARNING - __main__ - Process rank: 0, device: cuda:0, n_gpu: 1distributed training: True, 16-bits training: False\n",
|
374 |
+
"06/07/2023 16:47:13 - INFO - __main__ - Training/evaluation parameters TrainingArguments(\n",
|
375 |
"_n_gpu=1,\n",
|
376 |
"adafactor=False,\n",
|
377 |
"adam_beta1=0.9,\n",
|
|
|
428 |
"log_level=passive,\n",
|
429 |
"log_level_replica=warning,\n",
|
430 |
"log_on_each_node=True,\n",
|
431 |
+
"logging_dir=eval_results/runs/Jun07_16-47-13_0d4f01f1a5fc,\n",
|
432 |
"logging_first_step=False,\n",
|
433 |
"logging_nan_inf_filter=True,\n",
|
434 |
"logging_steps=500,\n",
|
|
|
480 |
"weight_decay=0.0,\n",
|
481 |
"xpu_backend=None,\n",
|
482 |
")\n",
|
483 |
+
"06/07/2023 16:47:13 - INFO - datasets.utils.file_utils - https://huggingface.co/datasets/squad_it/resolve/main/squad_it.py not found in cache or force_download set to True, downloading to /root/.cache/huggingface/datasets/downloads/tmp6fvibkw8\n",
|
484 |
+
"Downloading builder script: 100% 4.74k/4.74k [00:00<00:00, 6.03MB/s]\n",
|
485 |
+
"06/07/2023 16:47:14 - INFO - datasets.utils.file_utils - storing https://huggingface.co/datasets/squad_it/resolve/main/squad_it.py in cache at /root/.cache/huggingface/datasets/downloads/2f7a246f661e6acb3a9ad072ed14241ea343265e7d863b88717897941c3ab1dd.671c3c3daf2f05e0355b498b0f5a7f2167fa94dc6de36195fe1ba0503e6dcc30.py\n",
|
486 |
+
"06/07/2023 16:47:14 - INFO - datasets.utils.file_utils - creating metadata file for /root/.cache/huggingface/datasets/downloads/2f7a246f661e6acb3a9ad072ed14241ea343265e7d863b88717897941c3ab1dd.671c3c3daf2f05e0355b498b0f5a7f2167fa94dc6de36195fe1ba0503e6dcc30.py\n",
|
487 |
+
"06/07/2023 16:47:14 - INFO - datasets.utils.file_utils - https://huggingface.co/datasets/squad_it/resolve/main/dataset_infos.json not found in cache or force_download set to True, downloading to /root/.cache/huggingface/datasets/downloads/tmpax6jsbgs\n",
|
488 |
+
"Downloading metadata: 100% 2.51k/2.51k [00:00<00:00, 2.96MB/s]\n",
|
489 |
+
"06/07/2023 16:47:14 - INFO - datasets.utils.file_utils - storing https://huggingface.co/datasets/squad_it/resolve/main/dataset_infos.json in cache at /root/.cache/huggingface/datasets/downloads/f6d7650a1e4a9f0e42b54f34ac614f7c1142ad26c1bd19a448eb606fe09f7515.b459489a7b1a4d859decbeef851034c7846ef6cce8ec2cf192cf4b4f40d0865d\n",
|
490 |
+
"06/07/2023 16:47:14 - INFO - datasets.utils.file_utils - creating metadata file for /root/.cache/huggingface/datasets/downloads/f6d7650a1e4a9f0e42b54f34ac614f7c1142ad26c1bd19a448eb606fe09f7515.b459489a7b1a4d859decbeef851034c7846ef6cce8ec2cf192cf4b4f40d0865d\n",
|
491 |
+
"06/07/2023 16:47:14 - INFO - datasets.utils.file_utils - https://huggingface.co/datasets/squad_it/resolve/main/README.md not found in cache or force_download set to True, downloading to /root/.cache/huggingface/datasets/downloads/tmpmy7om6r1\n",
|
492 |
+
"Downloading readme: 100% 7.27k/7.27k [00:00<00:00, 9.54MB/s]\n",
|
493 |
+
"06/07/2023 16:47:14 - INFO - datasets.utils.file_utils - storing https://huggingface.co/datasets/squad_it/resolve/main/README.md in cache at /root/.cache/huggingface/datasets/downloads/b664892e5965a1ef2e173eadc7e9cbf6ad4aeb6240d7b3bb6ab9f32850363a6f.71fe7dbf5f3b574d85b57b5a722ebc49fe8ec8b03d655344891fb1b05c4634fb\n",
|
494 |
+
"06/07/2023 16:47:14 - INFO - datasets.utils.file_utils - creating metadata file for /root/.cache/huggingface/datasets/downloads/b664892e5965a1ef2e173eadc7e9cbf6ad4aeb6240d7b3bb6ab9f32850363a6f.71fe7dbf5f3b574d85b57b5a722ebc49fe8ec8b03d655344891fb1b05c4634fb\n",
|
495 |
+
"06/07/2023 16:47:14 - INFO - datasets.info - Loading Dataset Infos from /root/.cache/huggingface/modules/datasets_modules/datasets/squad_it/d442bdb4794b4bae227ab19105b76d706ed7cf2ac342e4c9da4a5c36bde19d71\n",
|
496 |
+
"06/07/2023 16:47:14 - INFO - datasets.builder - Generating dataset squad_it (/root/.cache/huggingface/datasets/squad_it/default/0.1.0/d442bdb4794b4bae227ab19105b76d706ed7cf2ac342e4c9da4a5c36bde19d71)\n",
|
497 |
"Downloading and preparing dataset squad_it/default to /root/.cache/huggingface/datasets/squad_it/default/0.1.0/d442bdb4794b4bae227ab19105b76d706ed7cf2ac342e4c9da4a5c36bde19d71...\n",
|
498 |
+
"06/07/2023 16:47:14 - INFO - datasets.builder - Dataset not on Hf google storage. Downloading and preparing it from source\n",
|
499 |
+
"Downloading data files: 0% 0/2 [00:00<?, ?it/s]06/07/2023 16:47:15 - INFO - datasets.utils.file_utils - https://github.com/crux82/squad-it/raw/master/SQuAD_it-train.json.gz not found in cache or force_download set to True, downloading to /root/.cache/huggingface/datasets/downloads/tmpsh92z3dw\n",
|
500 |
"\n",
|
501 |
"Downloading data: 0% 0.00/7.73M [00:00<?, ?B/s]\u001b[A\n",
|
502 |
+
"Downloading data: 100% 7.73M/7.73M [00:00<00:00, 40.9MB/s]\n",
|
503 |
+
"06/07/2023 16:47:15 - INFO - datasets.utils.file_utils - storing https://github.com/crux82/squad-it/raw/master/SQuAD_it-train.json.gz in cache at /root/.cache/huggingface/datasets/downloads/44ac0548c3284061d1356ff7f5212fe42b923b0aa0854c886ce93dfeb7ab629b\n",
|
504 |
+
"06/07/2023 16:47:15 - INFO - datasets.utils.file_utils - creating metadata file for /root/.cache/huggingface/datasets/downloads/44ac0548c3284061d1356ff7f5212fe42b923b0aa0854c886ce93dfeb7ab629b\n",
|
505 |
+
"Downloading data files: 50% 1/2 [00:00<00:00, 1.03it/s]06/07/2023 16:47:16 - INFO - datasets.utils.file_utils - https://github.com/crux82/squad-it/raw/master/SQuAD_it-test.json.gz not found in cache or force_download set to True, downloading to /root/.cache/huggingface/datasets/downloads/tmp99vaamp8\n",
|
506 |
"\n",
|
507 |
+
"Downloading data: 0% 0.00/1.05M [00:00<?, ?B/s]\u001b[A\n",
|
508 |
+
"Downloading data: 100% 1.05M/1.05M [00:00<00:00, 10.1MB/s]\n",
|
509 |
+
"06/07/2023 16:47:16 - INFO - datasets.utils.file_utils - storing https://github.com/crux82/squad-it/raw/master/SQuAD_it-test.json.gz in cache at /root/.cache/huggingface/datasets/downloads/e560a4a54eb929ce542e945627942afca80859dcbf499866a59984eb9026d31f\n",
|
510 |
+
"06/07/2023 16:47:16 - INFO - datasets.utils.file_utils - creating metadata file for /root/.cache/huggingface/datasets/downloads/e560a4a54eb929ce542e945627942afca80859dcbf499866a59984eb9026d31f\n",
|
511 |
+
"Downloading data files: 100% 2/2 [00:01<00:00, 1.13it/s]\n",
|
512 |
+
"06/07/2023 16:47:16 - INFO - datasets.download.download_manager - Downloading took 0.0 min\n",
|
513 |
+
"06/07/2023 16:47:16 - INFO - datasets.download.download_manager - Checksum Computation took 0.0 min\n",
|
514 |
+
"Extracting data files: 100% 2/2 [00:00<00:00, 8.64it/s]\n",
|
515 |
+
"06/07/2023 16:47:16 - INFO - datasets.builder - Generating train split\n",
|
516 |
+
"06/07/2023 16:47:22 - INFO - datasets.builder - Generating test split\n",
|
517 |
+
"06/07/2023 16:47:23 - INFO - datasets.utils.info_utils - All the splits matched successfully.\n",
|
518 |
"Dataset squad_it downloaded and prepared to /root/.cache/huggingface/datasets/squad_it/default/0.1.0/d442bdb4794b4bae227ab19105b76d706ed7cf2ac342e4c9da4a5c36bde19d71. Subsequent calls will reuse this data.\n",
|
519 |
+
"100% 2/2 [00:00<00:00, 542.64it/s]\n",
|
520 |
+
"Downloading (…)lve/main/config.json: 100% 826/826 [00:00<00:00, 5.76MB/s]\n",
|
521 |
+
"[INFO|configuration_utils.py:669] 2023-06-07 16:47:23,846 >> loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--osiria--deberta-italian-question-answering/snapshots/e93341adad1d2140bacd231c54d7c3e0fd1317c3/config.json\n",
|
522 |
+
"[INFO|configuration_utils.py:725] 2023-06-07 16:47:23,850 >> Model config DebertaV2Config {\n",
|
523 |
" \"_name_or_path\": \"osiria/deberta-italian-question-answering\",\n",
|
524 |
" \"architectures\": [\n",
|
525 |
" \"DebertaV2ForQuestionAnswering\"\n",
|
|
|
555 |
" \"vocab_size\": 50256\n",
|
556 |
"}\n",
|
557 |
"\n",
|
558 |
+
"Downloading (…)okenizer_config.json: 100% 412/412 [00:00<00:00, 2.41MB/s]\n",
|
559 |
+
"Downloading (…)/main/tokenizer.json: 100% 2.02M/2.02M [00:00<00:00, 12.6MB/s]\n",
|
560 |
+
"[INFO|tokenization_utils_base.py:1823] 2023-06-07 16:47:24,622 >> loading file spm.model from cache at None\n",
|
561 |
+
"[INFO|tokenization_utils_base.py:1823] 2023-06-07 16:47:24,622 >> loading file tokenizer.json from cache at /root/.cache/huggingface/hub/models--osiria--deberta-italian-question-answering/snapshots/e93341adad1d2140bacd231c54d7c3e0fd1317c3/tokenizer.json\n",
|
562 |
+
"[INFO|tokenization_utils_base.py:1823] 2023-06-07 16:47:24,622 >> loading file added_tokens.json from cache at None\n",
|
563 |
+
"[INFO|tokenization_utils_base.py:1823] 2023-06-07 16:47:24,622 >> loading file special_tokens_map.json from cache at None\n",
|
564 |
+
"[INFO|tokenization_utils_base.py:1823] 2023-06-07 16:47:24,622 >> loading file tokenizer_config.json from cache at /root/.cache/huggingface/hub/models--osiria--deberta-italian-question-answering/snapshots/e93341adad1d2140bacd231c54d7c3e0fd1317c3/tokenizer_config.json\n",
|
565 |
+
"Downloading pytorch_model.bin: 100% 496M/496M [00:07<00:00, 66.0MB/s]\n",
|
566 |
+
"[INFO|modeling_utils.py:2578] 2023-06-07 16:47:32,789 >> loading weights file pytorch_model.bin from cache at /root/.cache/huggingface/hub/models--osiria--deberta-italian-question-answering/snapshots/e93341adad1d2140bacd231c54d7c3e0fd1317c3/pytorch_model.bin\n",
|
567 |
+
"[INFO|modeling_utils.py:3295] 2023-06-07 16:47:34,943 >> All model checkpoint weights were used when initializing DebertaV2ForQuestionAnswering.\n",
|
568 |
"\n",
|
569 |
+
"[INFO|modeling_utils.py:3303] 2023-06-07 16:47:34,943 >> All the weights of DebertaV2ForQuestionAnswering were initialized from the model checkpoint at osiria/deberta-italian-question-answering.\n",
|
570 |
"If your task is similar to the task the model of the checkpoint was trained on, you can already use DebertaV2ForQuestionAnswering for predictions without further training.\n",
|
571 |
+
"Running tokenizer on prediction dataset: 0% 0/7609 [00:00<?, ? examples/s]06/07/2023 16:47:36 - INFO - datasets.arrow_dataset - Caching processed dataset at /root/.cache/huggingface/datasets/squad_it/default/0.1.0/d442bdb4794b4bae227ab19105b76d706ed7cf2ac342e4c9da4a5c36bde19d71/cache-c70dd3f912ae21c4.arrow\n",
|
572 |
+
"Downloading builder script: 100% 4.53k/4.53k [00:00<00:00, 4.58MB/s]\n",
|
573 |
+
"Downloading extra modules: 100% 3.32k/3.32k [00:00<00:00, 3.72MB/s]\n",
|
574 |
+
"06/07/2023 16:47:48 - INFO - __main__ - *** Predict ***\n",
|
575 |
+
"[INFO|trainer.py:774] 2023-06-07 16:47:48,896 >> The following columns in the test set don't have a corresponding argument in `DebertaV2ForQuestionAnswering.forward` and have been ignored: offset_mapping, example_id. If offset_mapping, example_id are not expected by `DebertaV2ForQuestionAnswering.forward`, you can safely ignore this message.\n",
|
576 |
+
"[INFO|trainer.py:3163] 2023-06-07 16:47:48,899 >> ***** Running Prediction *****\n",
|
577 |
+
"[INFO|trainer.py:3165] 2023-06-07 16:47:48,899 >> Num examples = 8565\n",
|
578 |
+
"[INFO|trainer.py:3168] 2023-06-07 16:47:48,899 >> Batch size = 5\n",
|
579 |
+
"100% 1713/1713 [04:44<00:00, 5.97it/s]06/07/2023 16:52:48 - INFO - utils_qa - Post-processing 7609 example predictions split into 8565 features.\n",
|
580 |
"\n",
|
581 |
" 0% 0/7609 [00:00<?, ?it/s]\u001b[A\n",
|
582 |
+
" 0% 31/7609 [00:00<00:24, 303.25it/s]\u001b[A\n",
|
583 |
+
" 1% 63/7609 [00:00<00:24, 307.26it/s]\u001b[A\n",
|
584 |
+
" 1% 94/7609 [00:00<00:24, 303.34it/s]\u001b[A\n",
|
585 |
+
" 2% 129/7609 [00:00<00:23, 318.34it/s]\u001b[A\n",
|
586 |
+
" 2% 162/7609 [00:00<00:23, 320.97it/s]\u001b[A\n",
|
587 |
+
" 3% 195/7609 [00:00<00:23, 321.01it/s]\u001b[A\n",
|
588 |
+
" 3% 232/7609 [00:00<00:21, 335.66it/s]\u001b[A\n",
|
589 |
+
" 3% 266/7609 [00:00<00:21, 334.20it/s]\u001b[A\n",
|
590 |
+
" 4% 300/7609 [00:00<00:22, 318.84it/s]\u001b[A\n",
|
591 |
+
" 4% 333/7609 [00:01<00:23, 311.86it/s]\u001b[A\n",
|
592 |
+
" 5% 365/7609 [00:01<00:23, 303.43it/s]\u001b[A\n",
|
593 |
+
" 5% 401/7609 [00:01<00:22, 317.40it/s]\u001b[A\n",
|
594 |
+
" 6% 434/7609 [00:01<00:22, 319.56it/s]\u001b[A\n",
|
595 |
+
" 6% 470/7609 [00:01<00:21, 330.55it/s]\u001b[A\n",
|
596 |
+
" 7% 504/7609 [00:01<00:23, 307.96it/s]\u001b[A\n",
|
597 |
+
" 7% 536/7609 [00:01<00:24, 285.18it/s]\u001b[A\n",
|
598 |
+
" 7% 568/7609 [00:01<00:23, 293.60it/s]\u001b[A\n",
|
599 |
+
" 8% 604/7609 [00:01<00:22, 310.55it/s]\u001b[A\n",
|
600 |
+
" 8% 639/7609 [00:02<00:21, 320.12it/s]\u001b[A\n",
|
601 |
+
" 9% 673/7609 [00:02<00:21, 323.88it/s]\u001b[A\n",
|
602 |
+
" 9% 709/7609 [00:02<00:20, 331.99it/s]\u001b[A\n",
|
603 |
+
" 10% 743/7609 [00:02<00:20, 329.46it/s]\u001b[A\n",
|
604 |
+
" 10% 777/7609 [00:02<00:20, 329.40it/s]\u001b[A\n",
|
605 |
+
" 11% 811/7609 [00:02<00:22, 306.52it/s]\u001b[A\n",
|
606 |
+
" 11% 843/7609 [00:02<00:22, 297.72it/s]\u001b[A\n",
|
607 |
+
" 11% 875/7609 [00:02<00:22, 303.71it/s]\u001b[A\n",
|
608 |
+
" 12% 910/7609 [00:02<00:21, 316.04it/s]\u001b[A\n",
|
609 |
+
" 12% 945/7609 [00:02<00:20, 323.67it/s]\u001b[A\n",
|
610 |
+
" 13% 978/7609 [00:03<00:20, 318.32it/s]\u001b[A\n",
|
611 |
+
" 13% 1014/7609 [00:03<00:20, 327.90it/s]\u001b[A\n",
|
612 |
+
" 14% 1049/7609 [00:03<00:19, 332.85it/s]\u001b[A\n",
|
613 |
+
" 14% 1085/7609 [00:03<00:19, 339.69it/s]\u001b[A\n",
|
614 |
+
" 15% 1120/7609 [00:03<00:20, 313.00it/s]\u001b[A\n",
|
615 |
+
" 15% 1152/7609 [00:03<00:21, 299.88it/s]\u001b[A\n",
|
616 |
+
" 16% 1183/7609 [00:03<00:21, 296.07it/s]\u001b[A\n",
|
617 |
+
" 16% 1219/7609 [00:03<00:20, 312.27it/s]\u001b[A\n",
|
618 |
+
" 16% 1255/7609 [00:03<00:19, 325.08it/s]\u001b[A\n",
|
619 |
+
" 17% 1293/7609 [00:04<00:18, 336.93it/s]\u001b[A\n",
|
620 |
+
" 17% 1328/7609 [00:04<00:18, 338.57it/s]\u001b[A\n",
|
621 |
+
" 18% 1363/7609 [00:04<00:18, 340.16it/s]\u001b[A\n",
|
622 |
+
" 18% 1398/7609 [00:04<00:20, 300.47it/s]\u001b[A\n",
|
623 |
+
" 19% 1429/7609 [00:04<00:20, 302.31it/s]\u001b[A\n",
|
624 |
+
" 19% 1460/7609 [00:04<00:21, 284.58it/s]\u001b[A\n",
|
625 |
+
" 20% 1490/7609 [00:04<00:22, 272.85it/s]\u001b[A\n",
|
626 |
+
" 20% 1519/7609 [00:04<00:22, 274.45it/s]\u001b[A\n",
|
627 |
+
" 20% 1553/7609 [00:04<00:20, 290.63it/s]\u001b[A\n",
|
628 |
+
" 21% 1586/7609 [00:05<00:20, 300.36it/s]\u001b[A\n",
|
629 |
+
" 21% 1617/7609 [00:05<00:21, 281.28it/s]\u001b[A\n",
|
630 |
+
" 22% 1646/7609 [00:05<00:21, 281.66it/s]\u001b[A\n",
|
631 |
+
" 22% 1675/7609 [00:05<00:22, 263.57it/s]\u001b[A\n",
|
632 |
+
" 22% 1702/7609 [00:05<00:25, 227.69it/s]\u001b[A\n",
|
633 |
+
" 23% 1726/7609 [00:05<00:26, 218.54it/s]\u001b[A\n",
|
634 |
+
" 23% 1749/7609 [00:05<00:27, 213.80it/s]\u001b[A\n",
|
635 |
+
" 23% 1771/7609 [00:05<00:31, 185.78it/s]\u001b[A\n",
|
636 |
+
" 24% 1791/7609 [00:06<00:33, 175.38it/s]\u001b[A\n",
|
637 |
+
" 24% 1810/7609 [00:06<00:33, 173.38it/s]\u001b[A\n",
|
638 |
+
" 24% 1828/7609 [00:06<00:35, 161.63it/s]\u001b[A\n",
|
639 |
+
" 24% 1845/7609 [00:06<00:35, 161.26it/s]\u001b[A\n",
|
640 |
+
" 24% 1862/7609 [00:06<00:35, 163.22it/s]\u001b[A\n",
|
641 |
+
" 25% 1879/7609 [00:06<00:34, 164.44it/s]\u001b[A\n",
|
642 |
+
" 25% 1896/7609 [00:06<00:35, 162.09it/s]\u001b[A\n",
|
643 |
+
" 25% 1913/7609 [00:06<00:35, 158.55it/s]\u001b[A\n",
|
644 |
+
" 25% 1931/7609 [00:07<00:34, 162.40it/s]\u001b[A\n",
|
645 |
+
" 26% 1950/7609 [00:07<00:34, 164.90it/s]\u001b[A\n",
|
646 |
+
" 26% 1967/7609 [00:07<00:42, 131.44it/s]\u001b[A\n",
|
647 |
+
" 26% 1982/7609 [00:07<00:44, 125.12it/s]\u001b[A\n",
|
648 |
+
" 26% 1996/7609 [00:07<00:49, 114.26it/s]\u001b[A\n",
|
649 |
+
" 26% 2009/7609 [00:07<00:53, 104.66it/s]\u001b[A\n",
|
650 |
+
" 27% 2020/7609 [00:07<01:00, 92.58it/s] \u001b[A\n",
|
651 |
+
" 27% 2030/7609 [00:08<01:01, 91.17it/s]\u001b[A\n",
|
652 |
+
" 27% 2043/7609 [00:08<00:56, 99.17it/s]\u001b[A\n",
|
653 |
+
" 27% 2060/7609 [00:08<00:47, 115.87it/s]\u001b[A\n",
|
654 |
+
" 27% 2073/7609 [00:08<01:02, 88.21it/s] \u001b[A\n",
|
655 |
+
" 27% 2084/7609 [00:08<01:13, 75.15it/s]\u001b[A\n",
|
656 |
+
" 28% 2093/7609 [00:08<01:15, 73.17it/s]\u001b[A\n",
|
657 |
+
" 28% 2102/7609 [00:09<01:27, 62.94it/s]\u001b[A\n",
|
658 |
+
" 28% 2121/7609 [00:09<01:02, 88.09it/s]\u001b[A\n",
|
659 |
+
" 28% 2143/7609 [00:09<00:47, 115.89it/s]\u001b[A\n",
|
660 |
+
" 28% 2164/7609 [00:09<00:39, 137.76it/s]\u001b[A\n",
|
661 |
+
" 29% 2183/7609 [00:09<00:36, 150.34it/s]\u001b[A\n",
|
662 |
+
" 29% 2204/7609 [00:09<00:32, 165.87it/s]\u001b[A\n",
|
663 |
+
" 29% 2230/7609 [00:09<00:28, 190.59it/s]\u001b[A\n",
|
664 |
+
" 30% 2254/7609 [00:09<00:26, 203.95it/s]\u001b[A\n",
|
665 |
+
" 30% 2284/7609 [00:09<00:23, 230.75it/s]\u001b[A\n",
|
666 |
+
" 30% 2317/7609 [00:09<00:20, 257.80it/s]\u001b[A\n",
|
667 |
+
" 31% 2351/7609 [00:10<00:18, 281.05it/s]\u001b[A\n",
|
668 |
+
" 31% 2381/7609 [00:10<00:18, 286.24it/s]\u001b[A\n",
|
669 |
+
" 32% 2415/7609 [00:10<00:17, 301.26it/s]\u001b[A\n",
|
670 |
+
" 32% 2449/7609 [00:10<00:16, 308.37it/s]\u001b[A\n",
|
671 |
+
" 33% 2480/7609 [00:10<00:18, 280.50it/s]\u001b[A\n",
|
672 |
+
" 33% 2512/7609 [00:10<00:17, 289.91it/s]\u001b[A\n",
|
673 |
+
" 33% 2542/7609 [00:10<00:17, 292.21it/s]\u001b[A\n",
|
674 |
+
" 34% 2574/7609 [00:10<00:16, 298.20it/s]\u001b[A\n",
|
675 |
+
" 34% 2605/7609 [00:10<00:17, 278.61it/s]\u001b[A\n",
|
676 |
+
" 35% 2635/7609 [00:11<00:17, 281.15it/s]\u001b[A\n",
|
677 |
+
" 35% 2669/7609 [00:11<00:16, 296.96it/s]\u001b[A\n",
|
678 |
+
" 35% 2701/7609 [00:11<00:16, 302.08it/s]\u001b[A\n",
|
679 |
+
" 36% 2732/7609 [00:11<00:16, 302.15it/s]\u001b[A\n",
|
680 |
+
" 36% 2764/7609 [00:11<00:15, 305.76it/s]\u001b[A\n",
|
681 |
+
" 37% 2797/7609 [00:11<00:15, 312.07it/s]\u001b[A\n",
|
682 |
+
" 37% 2829/7609 [00:11<00:15, 311.10it/s]\u001b[A\n",
|
683 |
+
" 38% 2861/7609 [00:11<00:15, 313.11it/s]\u001b[A\n",
|
684 |
+
" 38% 2893/7609 [00:11<00:14, 314.97it/s]\u001b[A\n",
|
685 |
+
" 38% 2929/7609 [00:11<00:14, 328.02it/s]\u001b[A\n",
|
686 |
+
" 39% 2965/7609 [00:12<00:13, 335.60it/s]\u001b[A\n",
|
687 |
+
" 39% 2999/7609 [00:12<00:14, 311.13it/s]\u001b[A\n",
|
688 |
+
" 40% 3031/7609 [00:12<00:15, 300.91it/s]\u001b[A\n",
|
689 |
+
" 40% 3064/7609 [00:12<00:14, 308.83it/s]\u001b[A\n",
|
690 |
+
" 41% 3096/7609 [00:12<00:14, 310.64it/s]\u001b[A\n",
|
691 |
+
" 41% 3128/7609 [00:12<00:14, 298.83it/s]\u001b[A\n",
|
692 |
+
" 42% 3162/7609 [00:12<00:14, 309.13it/s]\u001b[A\n",
|
693 |
+
" 42% 3194/7609 [00:12<00:15, 277.97it/s]\u001b[A\n",
|
694 |
+
" 42% 3223/7609 [00:12<00:16, 264.49it/s]\u001b[A\n",
|
695 |
+
" 43% 3257/7609 [00:13<00:15, 284.09it/s]\u001b[A\n",
|
696 |
+
" 43% 3290/7609 [00:13<00:14, 294.71it/s]\u001b[A\n",
|
697 |
+
" 44% 3320/7609 [00:13<00:14, 293.52it/s]\u001b[A\n",
|
698 |
+
" 44% 3350/7609 [00:13<00:14, 288.16it/s]\u001b[A\n",
|
699 |
+
" 44% 3386/7609 [00:13<00:13, 306.68it/s]\u001b[A\n",
|
700 |
+
" 45% 3418/7609 [00:13<00:13, 308.84it/s]\u001b[A\n",
|
701 |
+
" 45% 3450/7609 [00:13<00:13, 311.26it/s]\u001b[A\n",
|
702 |
+
" 46% 3486/7609 [00:13<00:12, 325.33it/s]\u001b[A\n",
|
703 |
+
" 46% 3519/7609 [00:13<00:12, 326.31it/s]\u001b[A\n",
|
704 |
+
" 47% 3552/7609 [00:13<00:12, 320.66it/s]\u001b[A\n",
|
705 |
+
" 47% 3585/7609 [00:14<00:12, 316.53it/s]\u001b[A\n",
|
706 |
+
" 48% 3617/7609 [00:14<00:12, 311.52it/s]\u001b[A\n",
|
707 |
+
" 48% 3649/7609 [00:14<00:13, 303.36it/s]\u001b[A\n",
|
708 |
+
" 48% 3684/7609 [00:14<00:12, 314.49it/s]\u001b[A\n",
|
709 |
+
" 49% 3719/7609 [00:14<00:11, 324.33it/s]\u001b[A\n",
|
710 |
+
" 49% 3753/7609 [00:14<00:11, 326.51it/s]\u001b[A\n",
|
711 |
+
" 50% 3786/7609 [00:14<00:12, 312.75it/s]\u001b[A\n",
|
712 |
+
" 50% 3818/7609 [00:14<00:12, 308.95it/s]\u001b[A\n",
|
713 |
+
" 51% 3853/7609 [00:14<00:11, 319.23it/s]\u001b[A\n",
|
714 |
+
" 51% 3890/7609 [00:15<00:11, 331.91it/s]\u001b[A\n",
|
715 |
+
" 52% 3925/7609 [00:15<00:10, 334.96it/s]\u001b[A\n",
|
716 |
+
" 52% 3959/7609 [00:15<00:10, 332.60it/s]\u001b[A\n",
|
717 |
+
" 52% 3993/7609 [00:15<00:11, 322.10it/s]\u001b[A\n",
|
718 |
+
" 53% 4026/7609 [00:15<00:11, 315.63it/s]\u001b[A\n",
|
719 |
+
" 53% 4058/7609 [00:15<00:11, 316.47it/s]\u001b[A\n",
|
720 |
+
" 54% 4090/7609 [00:15<00:12, 282.73it/s]\u001b[A\n",
|
721 |
+
" 54% 4122/7609 [00:15<00:11, 291.59it/s]\u001b[A\n",
|
722 |
+
" 55% 4155/7609 [00:15<00:11, 300.32it/s]\u001b[A\n",
|
723 |
+
" 55% 4186/7609 [00:16<00:11, 302.40it/s]\u001b[A\n",
|
724 |
+
" 55% 4217/7609 [00:16<00:11, 289.82it/s]\u001b[A\n",
|
725 |
+
" 56% 4251/7609 [00:16<00:11, 302.39it/s]\u001b[A\n",
|
726 |
+
" 56% 4285/7609 [00:16<00:10, 312.34it/s]\u001b[A\n",
|
727 |
+
" 57% 4317/7609 [00:16<00:11, 294.79it/s]\u001b[A\n",
|
728 |
+
" 57% 4348/7609 [00:16<00:10, 297.31it/s]\u001b[A\n",
|
729 |
+
" 58% 4383/7609 [00:16<00:10, 311.51it/s]\u001b[A\n",
|
730 |
+
" 58% 4418/7609 [00:16<00:09, 321.76it/s]\u001b[A\n",
|
731 |
+
" 58% 4451/7609 [00:16<00:10, 303.74it/s]\u001b[A\n",
|
732 |
+
" 59% 4487/7609 [00:16<00:09, 318.32it/s]\u001b[A\n",
|
733 |
+
" 59% 4521/7609 [00:17<00:09, 324.18it/s]\u001b[A\n",
|
734 |
+
" 60% 4554/7609 [00:17<00:09, 308.89it/s]\u001b[A\n",
|
735 |
+
" 60% 4589/7609 [00:17<00:09, 319.64it/s]\u001b[A\n",
|
736 |
+
" 61% 4625/7609 [00:17<00:09, 329.94it/s]\u001b[A\n",
|
737 |
+
" 61% 4662/7609 [00:17<00:08, 341.53it/s]\u001b[A\n",
|
738 |
+
" 62% 4697/7609 [00:17<00:08, 338.88it/s]\u001b[A\n",
|
739 |
+
" 62% 4735/7609 [00:17<00:08, 349.33it/s]\u001b[A\n",
|
740 |
+
" 63% 4771/7609 [00:17<00:08, 344.86it/s]\u001b[A\n",
|
741 |
+
" 63% 4806/7609 [00:17<00:08, 336.05it/s]\u001b[A\n",
|
742 |
+
" 64% 4840/7609 [00:18<00:08, 337.05it/s]\u001b[A\n",
|
743 |
+
" 64% 4874/7609 [00:18<00:08, 337.75it/s]\u001b[A\n",
|
744 |
+
" 65% 4908/7609 [00:18<00:08, 336.24it/s]\u001b[A\n",
|
745 |
+
" 65% 4942/7609 [00:18<00:07, 337.21it/s]\u001b[A\n",
|
746 |
+
" 65% 4976/7609 [00:18<00:08, 312.17it/s]\u001b[A\n",
|
747 |
+
" 66% 5009/7609 [00:18<00:08, 315.97it/s]\u001b[A\n",
|
748 |
+
" 66% 5043/7609 [00:18<00:07, 320.87it/s]\u001b[A\n",
|
749 |
+
" 67% 5079/7609 [00:18<00:07, 330.68it/s]\u001b[A\n",
|
750 |
+
" 67% 5114/7609 [00:18<00:07, 332.38it/s]\u001b[A\n",
|
751 |
+
" 68% 5148/7609 [00:18<00:07, 329.51it/s]\u001b[A\n",
|
752 |
+
" 68% 5182/7609 [00:19<00:07, 311.81it/s]\u001b[A\n",
|
753 |
+
" 69% 5214/7609 [00:19<00:07, 312.15it/s]\u001b[A\n",
|
754 |
+
" 69% 5247/7609 [00:19<00:07, 316.38it/s]\u001b[A\n",
|
755 |
+
" 69% 5279/7609 [00:19<00:07, 316.20it/s]\u001b[A\n",
|
756 |
+
" 70% 5311/7609 [00:19<00:07, 295.70it/s]\u001b[A\n",
|
757 |
+
" 70% 5341/7609 [00:19<00:08, 261.36it/s]\u001b[A\n",
|
758 |
+
" 71% 5368/7609 [00:19<00:09, 230.83it/s]\u001b[A\n",
|
759 |
+
" 71% 5393/7609 [00:19<00:10, 216.96it/s]\u001b[A\n",
|
760 |
+
" 71% 5416/7609 [00:20<00:10, 207.34it/s]\u001b[A\n",
|
761 |
+
" 71% 5438/7609 [00:20<00:10, 202.91it/s]\u001b[A\n",
|
762 |
+
" 72% 5459/7609 [00:20<00:10, 199.16it/s]\u001b[A\n",
|
763 |
+
" 72% 5480/7609 [00:20<00:11, 189.04it/s]\u001b[A\n",
|
764 |
+
" 72% 5500/7609 [00:20<00:11, 182.60it/s]\u001b[A\n",
|
765 |
+
" 73% 5519/7609 [00:20<00:11, 180.96it/s]\u001b[A\n",
|
766 |
+
" 73% 5538/7609 [00:20<00:11, 181.22it/s]\u001b[A\n",
|
767 |
+
" 73% 5557/7609 [00:20<00:11, 171.68it/s]\u001b[A\n",
|
768 |
+
" 73% 5576/7609 [00:21<00:11, 174.81it/s]\u001b[A\n",
|
769 |
+
" 74% 5596/7609 [00:21<00:11, 180.04it/s]\u001b[A\n",
|
770 |
+
" 74% 5616/7609 [00:21<00:10, 182.81it/s]\u001b[A\n",
|
771 |
+
" 74% 5635/7609 [00:21<00:10, 182.33it/s]\u001b[A\n",
|
772 |
+
" 74% 5654/7609 [00:21<00:11, 174.84it/s]\u001b[A\n",
|
773 |
+
" 75% 5674/7609 [00:21<00:10, 180.47it/s]\u001b[A\n",
|
774 |
+
" 75% 5694/7609 [00:21<00:10, 184.70it/s]\u001b[A\n",
|
775 |
+
" 75% 5716/7609 [00:21<00:09, 192.61it/s]\u001b[A\n",
|
776 |
+
" 75% 5737/7609 [00:21<00:09, 197.48it/s]\u001b[A\n",
|
777 |
+
" 76% 5759/7609 [00:21<00:09, 203.11it/s]\u001b[A\n",
|
778 |
+
" 76% 5781/7609 [00:22<00:08, 206.83it/s]\u001b[A\n",
|
779 |
+
" 76% 5804/7609 [00:22<00:08, 212.42it/s]\u001b[A\n",
|
780 |
+
" 77% 5826/7609 [00:22<00:08, 212.86it/s]\u001b[A\n",
|
781 |
+
" 77% 5848/7609 [00:22<00:09, 195.42it/s]\u001b[A\n",
|
782 |
+
" 77% 5869/7609 [00:22<00:08, 197.24it/s]\u001b[A\n",
|
783 |
+
" 77% 5890/7609 [00:22<00:08, 199.90it/s]\u001b[A\n",
|
784 |
+
" 78% 5911/7609 [00:22<00:08, 200.35it/s]\u001b[A\n",
|
785 |
+
" 78% 5932/7609 [00:22<00:08, 194.76it/s]\u001b[A\n",
|
786 |
+
" 78% 5952/7609 [00:22<00:09, 179.45it/s]\u001b[A\n",
|
787 |
+
" 78% 5973/7609 [00:23<00:08, 185.49it/s]\u001b[A\n",
|
788 |
+
" 79% 5994/7609 [00:23<00:08, 191.03it/s]\u001b[A\n",
|
789 |
+
" 79% 6014/7609 [00:23<00:08, 190.49it/s]\u001b[A\n",
|
790 |
+
" 79% 6034/7609 [00:23<00:10, 152.17it/s]\u001b[A\n",
|
791 |
+
" 80% 6055/7609 [00:23<00:09, 166.05it/s]\u001b[A\n",
|
792 |
+
" 80% 6090/7609 [00:23<00:07, 212.83it/s]\u001b[A\n",
|
793 |
+
" 80% 6113/7609 [00:23<00:06, 216.74it/s]\u001b[A\n",
|
794 |
+
" 81% 6136/7609 [00:23<00:07, 192.53it/s]\u001b[A\n",
|
795 |
+
" 81% 6157/7609 [00:24<00:07, 182.48it/s]\u001b[A\n",
|
796 |
+
" 81% 6191/7609 [00:24<00:06, 221.58it/s]\u001b[A\n",
|
797 |
+
" 82% 6229/7609 [00:24<00:05, 263.29it/s]\u001b[A\n",
|
798 |
+
" 82% 6267/7609 [00:24<00:04, 293.51it/s]\u001b[A\n",
|
799 |
+
" 83% 6301/7609 [00:24<00:04, 305.98it/s]\u001b[A\n",
|
800 |
+
" 83% 6337/7609 [00:24<00:03, 319.28it/s]\u001b[A\n",
|
801 |
+
" 84% 6372/7609 [00:24<00:03, 326.62it/s]\u001b[A\n",
|
802 |
+
" 84% 6411/7609 [00:24<00:03, 343.54it/s]\u001b[A\n",
|
803 |
+
" 85% 6446/7609 [00:24<00:03, 344.44it/s]\u001b[A\n",
|
804 |
+
" 85% 6482/7609 [00:24<00:03, 343.79it/s]\u001b[A\n",
|
805 |
+
" 86% 6517/7609 [00:25<00:03, 333.86it/s]\u001b[A\n",
|
806 |
+
" 86% 6551/7609 [00:25<00:03, 334.22it/s]\u001b[A\n",
|
807 |
+
" 87% 6585/7609 [00:25<00:03, 333.76it/s]\u001b[A\n",
|
808 |
+
" 87% 6619/7609 [00:25<00:03, 311.16it/s]\u001b[A\n",
|
809 |
+
" 87% 6654/7609 [00:25<00:02, 320.94it/s]\u001b[A\n",
|
810 |
+
" 88% 6687/7609 [00:25<00:02, 307.52it/s]\u001b[A\n",
|
811 |
+
" 88% 6723/7609 [00:25<00:02, 319.98it/s]\u001b[A\n",
|
812 |
+
" 89% 6756/7609 [00:25<00:02, 310.88it/s]\u001b[A\n",
|
813 |
+
" 89% 6789/7609 [00:25<00:02, 315.16it/s]\u001b[A\n",
|
814 |
+
" 90% 6821/7609 [00:26<00:02, 296.81it/s]\u001b[A\n",
|
815 |
+
" 90% 6851/7609 [00:26<00:02, 296.11it/s]\u001b[A\n",
|
816 |
+
" 90% 6881/7609 [00:26<00:02, 292.78it/s]\u001b[A\n",
|
817 |
+
" 91% 6918/7609 [00:26<00:02, 313.41it/s]\u001b[A\n",
|
818 |
+
" 91% 6950/7609 [00:26<00:02, 309.36it/s]\u001b[A\n",
|
819 |
+
" 92% 6984/7609 [00:26<00:01, 318.01it/s]\u001b[A\n",
|
820 |
+
" 92% 7017/7609 [00:26<00:01, 320.20it/s]\u001b[A\n",
|
821 |
+
" 93% 7050/7609 [00:26<00:01, 315.20it/s]\u001b[A\n",
|
822 |
+
" 93% 7082/7609 [00:26<00:01, 275.84it/s]\u001b[A\n",
|
823 |
+
" 93% 7111/7609 [00:27<00:01, 268.80it/s]\u001b[A\n",
|
824 |
+
" 94% 7139/7609 [00:27<00:01, 263.91it/s]\u001b[A\n",
|
825 |
+
" 94% 7166/7609 [00:27<00:01, 258.96it/s]\u001b[A\n",
|
826 |
+
" 95% 7193/7609 [00:27<00:01, 257.97it/s]\u001b[A\n",
|
827 |
+
" 95% 7226/7609 [00:27<00:01, 276.82it/s]\u001b[A\n",
|
828 |
+
" 95% 7258/7609 [00:27<00:01, 285.61it/s]\u001b[A\n",
|
829 |
+
" 96% 7292/7609 [00:27<00:01, 299.67it/s]\u001b[A\n",
|
830 |
+
" 96% 7325/7609 [00:27<00:00, 304.21it/s]\u001b[A\n",
|
831 |
+
" 97% 7357/7609 [00:27<00:00, 306.98it/s]\u001b[A\n",
|
832 |
+
" 97% 7391/7609 [00:28<00:00, 315.60it/s]\u001b[A\n",
|
833 |
+
" 98% 7423/7609 [00:28<00:00, 315.29it/s]\u001b[A\n",
|
834 |
+
" 98% 7455/7609 [00:28<00:00, 302.11it/s]\u001b[A\n",
|
835 |
+
" 98% 7486/7609 [00:28<00:00, 292.74it/s]\u001b[A\n",
|
836 |
+
" 99% 7516/7609 [00:28<00:00, 284.68it/s]\u001b[A\n",
|
837 |
+
" 99% 7545/7609 [00:28<00:00, 270.13it/s]\u001b[A\n",
|
838 |
+
"100% 7573/7609 [00:28<00:00, 254.51it/s]\u001b[A\n",
|
839 |
+
"100% 7609/7609 [00:28<00:00, 263.94it/s]\n",
|
840 |
+
"06/07/2023 16:53:17 - INFO - utils_qa - Saving predictions to eval_results/predict_predictions.json.\n",
|
841 |
+
"06/07/2023 16:53:17 - INFO - utils_qa - Saving nbest_preds to eval_results/predict_nbest_predictions.json.\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
842 |
"***** predict metrics *****\n",
|
843 |
" predict_samples = 8565\n",
|
844 |
+
" test_exact_match = 70.0486\n",
|
845 |
+
" test_f1 = 80.9773\n",
|
846 |
+
" test_runtime = 0:04:47.64\n",
|
847 |
+
" test_samples_per_second = 29.777\n",
|
848 |
+
" test_steps_per_second = 5.955\n",
|
849 |
+
"[INFO|modelcard.py:451] 2023-06-07 16:53:20,099 >> Dropping the following result as it does not have all the necessary fields:\n",
|
850 |
"{'task': {'name': 'Question Answering', 'type': 'question-answering'}, 'dataset': {'name': 'squad_it', 'type': 'squad_it'}}\n",
|
851 |
+
"100% 1713/1713 [05:28<00:00, 5.22it/s]\n"
|
852 |
]
|
853 |
}
|
854 |
]
|