Saving weights and logs of step 5000
Browse files- events.out.tfevents.1625843003.t1v-n-528d9406-w-0.250031.3.v2 +3 -0
- flax_model.msgpack +1 -1
- run_pretraining.sh +4 -4
- wandb/debug-internal.log +1 -1
- wandb/debug.log +1 -1
- wandb/latest-run +1 -1
- wandb/run-20210709_141445-2k8cnty2/files/config.yaml +4 -0
- wandb/run-20210709_141445-2k8cnty2/files/output.log +14 -0
- wandb/run-20210709_141445-2k8cnty2/files/wandb-summary.json +1 -1
- wandb/run-20210709_141445-2k8cnty2/logs/debug-internal.log +136 -0
- wandb/run-20210709_141445-2k8cnty2/logs/debug.log +135 -0
- wandb/run-20210709_141445-2k8cnty2/run-2k8cnty2.wandb +0 -0
- wandb/run-20210709_144100-2k1kyrq2/files/conda-environment.yaml +187 -0
- wandb/run-20210709_144100-2k1kyrq2/files/config.yaml +305 -0
- wandb/run-20210709_144100-2k1kyrq2/files/events.out.tfevents.1625843003.t1v-n-528d9406-w-0.250031.3.v2 +1 -0
- wandb/run-20210709_144100-2k1kyrq2/files/output.log +0 -0
- wandb/run-20210709_144100-2k1kyrq2/files/requirements.txt +153 -0
- wandb/run-20210709_144100-2k1kyrq2/files/wandb-metadata.json +48 -0
- wandb/run-20210709_144100-2k1kyrq2/files/wandb-summary.json +1 -0
- wandb/run-20210709_144100-2k1kyrq2/logs/debug-internal.log +0 -0
- wandb/run-20210709_144100-2k1kyrq2/logs/debug.log +29 -0
- wandb/run-20210709_144100-2k1kyrq2/run-2k1kyrq2.wandb +0 -0
events.out.tfevents.1625843003.t1v-n-528d9406-w-0.250031.3.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65f1a7d1164ca3b62fcc3dea900488379e35e8dbc651d2d586a093e695813bb7
|
3 |
+
size 735138
|
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1419302302
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c82df389e510b831d9a5c33f348a258ef105f78170ccc3efd78ab838d40a038b
|
3 |
size 1419302302
|
run_pretraining.sh
CHANGED
@@ -20,8 +20,8 @@ export WANDB_LOG_MODEL="true"
|
|
20 |
--num_train_epochs="20" \
|
21 |
--dataloader_num_workers="64" \
|
22 |
--preprocessing_num_workers="64" \
|
23 |
-
--
|
24 |
-
--
|
25 |
-
--
|
26 |
-
--
|
27 |
--push_to_hub
|
|
|
20 |
--num_train_epochs="20" \
|
21 |
--dataloader_num_workers="64" \
|
22 |
--preprocessing_num_workers="64" \
|
23 |
+
--logging_steps="5000" \
|
24 |
+
--save_steps="5000" \
|
25 |
+
--eval_steps="5000" \
|
26 |
+
--validation_split_percentage="2" \
|
27 |
--push_to_hub
|
wandb/debug-internal.log
CHANGED
@@ -1 +1 @@
|
|
1 |
-
run-
|
|
|
1 |
+
run-20210709_144100-2k1kyrq2/logs/debug-internal.log
|
wandb/debug.log
CHANGED
@@ -1 +1 @@
|
|
1 |
-
run-
|
|
|
1 |
+
run-20210709_144100-2k1kyrq2/logs/debug.log
|
wandb/latest-run
CHANGED
@@ -1 +1 @@
|
|
1 |
-
run-
|
|
|
1 |
+
run-20210709_144100-2k1kyrq2
|
wandb/run-20210709_141445-2k8cnty2/files/config.yaml
CHANGED
@@ -20,6 +20,10 @@ _wandb:
|
|
20 |
- 1
|
21 |
- 3
|
22 |
- 11
|
|
|
|
|
|
|
|
|
23 |
4: 3.8.10
|
24 |
5: 0.10.33
|
25 |
6: 4.9.0.dev0
|
|
|
20 |
- 1
|
21 |
- 3
|
22 |
- 11
|
23 |
+
2:
|
24 |
+
- 1
|
25 |
+
- 3
|
26 |
+
- 11
|
27 |
4: 3.8.10
|
28 |
5: 0.10.33
|
29 |
6: 4.9.0.dev0
|
wandb/run-20210709_141445-2k8cnty2/files/output.log
CHANGED
@@ -528,3 +528,17 @@ Training...: 92%|████████████████████
|
|
528 |
Evaluating...: 0%| | 0/5 [00:00<?, ?it/s]
|
529 |
|
530 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
528 |
Evaluating...: 0%| | 0/5 [00:00<?, ?it/s]
|
529 |
|
530 |
|
531 |
+
Model weights saved in /home/cahya/Work/flax-community/gpt2-medium-indonesian/flax_model.msgpack██████████████████████████████████████████████████████████████████████████████████████████████████████ | 48/52 [05:47<00:06, 1.74s/it]
|
532 |
+
Model pushed to the hub in this commit: https://huggingface.co/flax-community/gpt2-medium-indonesian/commit/9b9473462e797993d7ca4cfb92daa71c0bc81e9d
|
533 |
+
Step... (100 | Eval Loss: 7.69423770904541 | Eval Perplexity: 2195.65944089946): 10%|████████████▌ | 2/20 [14:54<2:13:01, 443.41s/it]
|
534 |
+
|
535 |
+
Training...: 12%|██████████████████████▌ | 6/52 [00:01<00:10, 4.36it/s]
|
536 |
+
File "./run_clm_flax.py", line 655, in <module>
|
537 |
+
main()
|
538 |
+
File "./run_clm_flax.py", line 620, in main
|
539 |
+
batch = next(eval_loader)
|
540 |
+
File "./run_clm_flax.py", line 193, in data_loader
|
541 |
+
for idx in batch_idx:
|
542 |
+
File "/home/cahya/miniconda3/envs/jax/lib/python3.8/site-packages/jax/interpreters/xla.py", line 1264, in __iter__
|
543 |
+
return self._value.__iter__()
|
544 |
+
KeyboardInterrupt
|
wandb/run-20210709_141445-2k8cnty2/files/wandb-summary.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"global_step":
|
|
|
1 |
+
{"global_step": 100, "_timestamp": 1625840946.414606, "eval_loss": 7.69423770904541, "eval_perplexity": 2195.659423828125, "_step": 9}
|
wandb/run-20210709_141445-2k8cnty2/logs/debug-internal.log
CHANGED
@@ -330,3 +330,139 @@
|
|
330 |
2021-07-09 14:29:24,657 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
|
331 |
2021-07-09 14:29:28,577 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
|
332 |
2021-07-09 14:29:28,578 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
330 |
2021-07-09 14:29:24,657 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
|
331 |
2021-07-09 14:29:28,577 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
|
332 |
2021-07-09 14:29:28,578 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
|
333 |
+
2021-07-09 14:29:43,713 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
|
334 |
+
2021-07-09 14:29:43,713 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
|
335 |
+
2021-07-09 14:29:47,814 DEBUG SenderThread:246776 [sender.py:send():179] send: stats
|
336 |
+
2021-07-09 14:29:58,843 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
|
337 |
+
2021-07-09 14:29:58,844 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
|
338 |
+
2021-07-09 14:30:13,979 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
|
339 |
+
2021-07-09 14:30:13,980 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
|
340 |
+
2021-07-09 14:30:17,889 DEBUG SenderThread:246776 [sender.py:send():179] send: stats
|
341 |
+
2021-07-09 14:30:24,683 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
|
342 |
+
2021-07-09 14:30:26,684 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
|
343 |
+
2021-07-09 14:30:28,685 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
|
344 |
+
2021-07-09 14:30:29,111 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
|
345 |
+
2021-07-09 14:30:29,111 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
|
346 |
+
2021-07-09 14:30:30,097 WARNING MainThread:246776 [internal.py:wandb_internal():147] Internal process interrupt: 1
|
347 |
+
2021-07-09 14:30:30,685 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
|
348 |
+
2021-07-09 14:30:34,687 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
|
349 |
+
2021-07-09 14:30:36,622 DEBUG SenderThread:246776 [sender.py:send():179] send: telemetry
|
350 |
+
2021-07-09 14:30:36,622 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
351 |
+
2021-07-09 14:30:36,622 DEBUG SenderThread:246776 [sender.py:send():179] send: exit
|
352 |
+
2021-07-09 14:30:36,622 INFO SenderThread:246776 [sender.py:send_exit():287] handling exit code: 255
|
353 |
+
2021-07-09 14:30:36,623 INFO SenderThread:246776 [sender.py:send_exit():295] send defer
|
354 |
+
2021-07-09 14:30:36,623 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
355 |
+
2021-07-09 14:30:36,624 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
|
356 |
+
2021-07-09 14:30:36,624 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 0
|
357 |
+
2021-07-09 14:30:36,624 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
|
358 |
+
2021-07-09 14:30:36,624 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 0
|
359 |
+
2021-07-09 14:30:36,624 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 1
|
360 |
+
2021-07-09 14:30:36,624 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
|
361 |
+
2021-07-09 14:30:36,624 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 1
|
362 |
+
2021-07-09 14:30:36,631 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
|
363 |
+
2021-07-09 14:30:36,631 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 1
|
364 |
+
2021-07-09 14:30:36,631 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 2
|
365 |
+
2021-07-09 14:30:36,631 DEBUG SenderThread:246776 [sender.py:send():179] send: stats
|
366 |
+
2021-07-09 14:30:36,632 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
|
367 |
+
2021-07-09 14:30:36,632 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 2
|
368 |
+
2021-07-09 14:30:36,688 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
|
369 |
+
2021-07-09 14:30:42,961 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
|
370 |
+
2021-07-09 14:30:42,961 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
371 |
+
2021-07-09 14:30:42,961 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 2
|
372 |
+
2021-07-09 14:30:42,961 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
373 |
+
2021-07-09 14:30:42,961 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 3
|
374 |
+
2021-07-09 14:30:42,962 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
375 |
+
2021-07-09 14:30:42,962 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
376 |
+
2021-07-09 14:30:42,963 DEBUG SenderThread:246776 [sender.py:send():179] send: history
|
377 |
+
2021-07-09 14:30:42,963 DEBUG SenderThread:246776 [sender.py:send():179] send: summary
|
378 |
+
2021-07-09 14:30:42,963 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
|
379 |
+
2021-07-09 14:30:42,964 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 3
|
380 |
+
2021-07-09 14:30:42,964 INFO SenderThread:246776 [sender.py:_save_file():841] saving file wandb-summary.json with policy end
|
381 |
+
2021-07-09 14:30:42,964 DEBUG SenderThread:246776 [sender.py:send():179] send: summary
|
382 |
+
2021-07-09 14:30:42,965 INFO SenderThread:246776 [sender.py:_save_file():841] saving file wandb-summary.json with policy end
|
383 |
+
2021-07-09 14:30:42,965 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
|
384 |
+
2021-07-09 14:30:42,965 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 3
|
385 |
+
2021-07-09 14:30:42,965 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 4
|
386 |
+
2021-07-09 14:30:42,965 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
|
387 |
+
2021-07-09 14:30:42,965 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 4
|
388 |
+
2021-07-09 14:30:42,965 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
|
389 |
+
2021-07-09 14:30:42,966 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 4
|
390 |
+
2021-07-09 14:30:43,065 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
391 |
+
2021-07-09 14:30:43,170 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 5
|
392 |
+
2021-07-09 14:30:43,170 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
393 |
+
2021-07-09 14:30:43,171 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
|
394 |
+
2021-07-09 14:30:43,171 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 5
|
395 |
+
2021-07-09 14:30:43,171 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
|
396 |
+
2021-07-09 14:30:43,171 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 5
|
397 |
+
2021-07-09 14:30:43,171 INFO SenderThread:246776 [dir_watcher.py:finish():282] shutting down directory watcher
|
398 |
+
2021-07-09 14:30:43,272 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
399 |
+
2021-07-09 14:30:43,690 INFO SenderThread:246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/config.yaml
|
400 |
+
2021-07-09 14:30:43,691 INFO SenderThread:246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/wandb-summary.json
|
401 |
+
2021-07-09 14:30:43,691 INFO SenderThread:246776 [dir_watcher.py:finish():312] scan: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files
|
402 |
+
2021-07-09 14:30:43,691 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/conda-environment.yaml conda-environment.yaml
|
403 |
+
2021-07-09 14:30:43,691 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/requirements.txt requirements.txt
|
404 |
+
2021-07-09 14:30:43,691 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log output.log
|
405 |
+
2021-07-09 14:30:43,692 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/wandb-metadata.json wandb-metadata.json
|
406 |
+
2021-07-09 14:30:43,692 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/config.yaml config.yaml
|
407 |
+
2021-07-09 14:30:43,695 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/events.out.tfevents.1625840127.t1v-n-528d9406-w-0.245719.3.v2 events.out.tfevents.1625840127.t1v-n-528d9406-w-0.245719.3.v2
|
408 |
+
2021-07-09 14:30:43,695 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/wandb-summary.json wandb-summary.json
|
409 |
+
2021-07-09 14:30:43,695 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 6
|
410 |
+
2021-07-09 14:30:43,695 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
411 |
+
2021-07-09 14:30:43,696 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
|
412 |
+
2021-07-09 14:30:43,705 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 6
|
413 |
+
2021-07-09 14:30:43,705 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
|
414 |
+
2021-07-09 14:30:43,705 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 6
|
415 |
+
2021-07-09 14:30:43,705 INFO SenderThread:246776 [file_pusher.py:finish():177] shutting down file pusher
|
416 |
+
2021-07-09 14:30:43,798 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
417 |
+
2021-07-09 14:30:43,798 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
418 |
+
2021-07-09 14:30:43,900 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
419 |
+
2021-07-09 14:30:43,900 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
420 |
+
2021-07-09 14:30:44,002 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
421 |
+
2021-07-09 14:30:44,002 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
422 |
+
2021-07-09 14:30:44,104 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
423 |
+
2021-07-09 14:30:44,104 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
424 |
+
2021-07-09 14:30:44,144 INFO Thread-24 :246776 [upload_job.py:push():137] Uploaded file /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/config.yaml
|
425 |
+
2021-07-09 14:30:44,145 INFO Thread-22 :246776 [upload_job.py:push():137] Uploaded file /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/requirements.txt
|
426 |
+
2021-07-09 14:30:44,154 INFO Thread-21 :246776 [upload_job.py:push():137] Uploaded file /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/conda-environment.yaml
|
427 |
+
2021-07-09 14:30:44,183 INFO Thread-26 :246776 [upload_job.py:push():137] Uploaded file /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/wandb-summary.json
|
428 |
+
2021-07-09 14:30:44,206 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
429 |
+
2021-07-09 14:30:44,206 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
430 |
+
2021-07-09 14:30:44,232 INFO Thread-25 :246776 [upload_job.py:push():137] Uploaded file /tmp/tmp4f0a6i2mwandb/i1mxdnz1-events.out.tfevents.1625840127.t1v-n-528d9406-w-0.245719.3.v2
|
431 |
+
2021-07-09 14:30:44,307 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
432 |
+
2021-07-09 14:30:44,308 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
433 |
+
2021-07-09 14:30:44,359 INFO Thread-23 :246776 [upload_job.py:push():137] Uploaded file /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
|
434 |
+
2021-07-09 14:30:44,409 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
435 |
+
2021-07-09 14:30:44,409 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
436 |
+
2021-07-09 14:30:44,511 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
437 |
+
2021-07-09 14:30:44,511 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
438 |
+
2021-07-09 14:30:44,559 INFO Thread-7 :246776 [sender.py:transition_state():308] send defer: 7
|
439 |
+
2021-07-09 14:30:44,560 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
|
440 |
+
2021-07-09 14:30:44,560 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 7
|
441 |
+
2021-07-09 14:30:44,560 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
|
442 |
+
2021-07-09 14:30:44,560 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 7
|
443 |
+
2021-07-09 14:30:44,612 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
444 |
+
2021-07-09 14:30:44,831 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 8
|
445 |
+
2021-07-09 14:30:44,831 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
446 |
+
2021-07-09 14:30:44,832 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
|
447 |
+
2021-07-09 14:30:44,832 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 8
|
448 |
+
2021-07-09 14:30:44,832 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
|
449 |
+
2021-07-09 14:30:44,832 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 8
|
450 |
+
2021-07-09 14:30:44,832 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 9
|
451 |
+
2021-07-09 14:30:44,833 DEBUG SenderThread:246776 [sender.py:send():179] send: final
|
452 |
+
2021-07-09 14:30:44,833 DEBUG SenderThread:246776 [sender.py:send():179] send: footer
|
453 |
+
2021-07-09 14:30:44,833 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
|
454 |
+
2021-07-09 14:30:44,833 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 9
|
455 |
+
2021-07-09 14:30:44,833 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
|
456 |
+
2021-07-09 14:30:44,833 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 9
|
457 |
+
2021-07-09 14:30:44,933 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
|
458 |
+
2021-07-09 14:30:44,933 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
|
459 |
+
2021-07-09 14:30:44,933 INFO SenderThread:246776 [file_pusher.py:join():182] waiting for file pusher
|
460 |
+
2021-07-09 14:30:44,935 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: get_summary
|
461 |
+
2021-07-09 14:30:44,936 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: sampled_history
|
462 |
+
2021-07-09 14:30:44,937 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: shutdown
|
463 |
+
2021-07-09 14:30:44,937 INFO HandlerThread:246776 [handler.py:finish():638] shutting down handler
|
464 |
+
2021-07-09 14:30:45,833 INFO WriterThread:246776 [datastore.py:close():288] close: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/run-2k8cnty2.wandb
|
465 |
+
2021-07-09 14:30:45,934 INFO SenderThread:246776 [sender.py:finish():945] shutting down sender
|
466 |
+
2021-07-09 14:30:45,934 INFO SenderThread:246776 [file_pusher.py:finish():177] shutting down file pusher
|
467 |
+
2021-07-09 14:30:45,934 INFO SenderThread:246776 [file_pusher.py:join():182] waiting for file pusher
|
468 |
+
2021-07-09 14:30:45,936 INFO MainThread:246776 [internal.py:handle_exit():78] Internal process exited
|
wandb/run-20210709_141445-2k8cnty2/logs/debug.log
CHANGED
@@ -27,3 +27,138 @@ config: {}
|
|
27 |
2021-07-09 14:14:49,958 INFO MainThread:245719 [wandb_config.py:__setitem__():141] config set test_log = 12345 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7fab4d59abb0>>
|
28 |
2021-07-09 14:14:49,958 INFO MainThread:245719 [wandb_run.py:_config_callback():872] config_cb test_log 12345 None
|
29 |
2021-07-09 14:15:27,424 INFO MainThread:245719 [wandb_run.py:_tensorboard_callback():943] tensorboard callback: /home/cahya/Work/flax-community/gpt2-medium-indonesian, None
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
27 |
2021-07-09 14:14:49,958 INFO MainThread:245719 [wandb_config.py:__setitem__():141] config set test_log = 12345 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7fab4d59abb0>>
|
28 |
2021-07-09 14:14:49,958 INFO MainThread:245719 [wandb_run.py:_config_callback():872] config_cb test_log 12345 None
|
29 |
2021-07-09 14:15:27,424 INFO MainThread:245719 [wandb_run.py:_tensorboard_callback():943] tensorboard callback: /home/cahya/Work/flax-community/gpt2-medium-indonesian, None
|
30 |
+
2021-07-09 14:30:34,276 INFO MainThread:245719 [wandb_run.py:_atexit_cleanup():1593] got exitcode: 255
|
31 |
+
2021-07-09 14:30:34,276 INFO MainThread:245719 [wandb_run.py:_restore():1565] restore
|
32 |
+
2021-07-09 14:30:36,624 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
33 |
+
wandb_count: 1
|
34 |
+
other_count: 1
|
35 |
+
}
|
36 |
+
pusher_stats {
|
37 |
+
uploaded_bytes: 3022
|
38 |
+
total_bytes: 3022
|
39 |
+
}
|
40 |
+
|
41 |
+
2021-07-09 14:30:41,726 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: None
|
42 |
+
2021-07-09 14:30:42,963 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
43 |
+
wandb_count: 1
|
44 |
+
other_count: 1
|
45 |
+
}
|
46 |
+
pusher_stats {
|
47 |
+
uploaded_bytes: 3022
|
48 |
+
total_bytes: 3022
|
49 |
+
}
|
50 |
+
|
51 |
+
2021-07-09 14:30:43,171 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
52 |
+
wandb_count: 1
|
53 |
+
other_count: 1
|
54 |
+
}
|
55 |
+
pusher_stats {
|
56 |
+
uploaded_bytes: 3022
|
57 |
+
total_bytes: 3022
|
58 |
+
}
|
59 |
+
|
60 |
+
2021-07-09 14:30:43,697 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
61 |
+
wandb_count: 5
|
62 |
+
other_count: 1
|
63 |
+
}
|
64 |
+
pusher_stats {
|
65 |
+
uploaded_bytes: 3022
|
66 |
+
total_bytes: 100895
|
67 |
+
}
|
68 |
+
|
69 |
+
2021-07-09 14:30:43,799 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
70 |
+
wandb_count: 6
|
71 |
+
other_count: 1
|
72 |
+
}
|
73 |
+
pusher_stats {
|
74 |
+
uploaded_bytes: 1722
|
75 |
+
total_bytes: 101169
|
76 |
+
}
|
77 |
+
|
78 |
+
2021-07-09 14:30:43,901 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
79 |
+
wandb_count: 6
|
80 |
+
other_count: 1
|
81 |
+
}
|
82 |
+
pusher_stats {
|
83 |
+
uploaded_bytes: 101169
|
84 |
+
total_bytes: 101169
|
85 |
+
}
|
86 |
+
|
87 |
+
2021-07-09 14:30:44,003 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
88 |
+
wandb_count: 6
|
89 |
+
other_count: 1
|
90 |
+
}
|
91 |
+
pusher_stats {
|
92 |
+
uploaded_bytes: 101169
|
93 |
+
total_bytes: 101169
|
94 |
+
}
|
95 |
+
|
96 |
+
2021-07-09 14:30:44,104 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
97 |
+
wandb_count: 6
|
98 |
+
other_count: 1
|
99 |
+
}
|
100 |
+
pusher_stats {
|
101 |
+
uploaded_bytes: 101169
|
102 |
+
total_bytes: 101169
|
103 |
+
}
|
104 |
+
|
105 |
+
2021-07-09 14:30:44,206 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
106 |
+
wandb_count: 6
|
107 |
+
other_count: 1
|
108 |
+
}
|
109 |
+
pusher_stats {
|
110 |
+
uploaded_bytes: 101169
|
111 |
+
total_bytes: 101169
|
112 |
+
}
|
113 |
+
|
114 |
+
2021-07-09 14:30:44,308 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
115 |
+
wandb_count: 6
|
116 |
+
other_count: 1
|
117 |
+
}
|
118 |
+
pusher_stats {
|
119 |
+
uploaded_bytes: 101169
|
120 |
+
total_bytes: 101169
|
121 |
+
}
|
122 |
+
|
123 |
+
2021-07-09 14:30:44,410 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
124 |
+
wandb_count: 6
|
125 |
+
other_count: 1
|
126 |
+
}
|
127 |
+
pusher_stats {
|
128 |
+
uploaded_bytes: 101169
|
129 |
+
total_bytes: 101169
|
130 |
+
}
|
131 |
+
|
132 |
+
2021-07-09 14:30:44,511 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
133 |
+
wandb_count: 6
|
134 |
+
other_count: 1
|
135 |
+
}
|
136 |
+
pusher_stats {
|
137 |
+
uploaded_bytes: 101169
|
138 |
+
total_bytes: 101169
|
139 |
+
}
|
140 |
+
|
141 |
+
2021-07-09 14:30:44,832 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
|
142 |
+
wandb_count: 6
|
143 |
+
other_count: 1
|
144 |
+
}
|
145 |
+
pusher_stats {
|
146 |
+
uploaded_bytes: 101169
|
147 |
+
total_bytes: 101169
|
148 |
+
}
|
149 |
+
|
150 |
+
2021-07-09 14:30:44,934 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: done: true
|
151 |
+
exit_result {
|
152 |
+
}
|
153 |
+
file_counts {
|
154 |
+
wandb_count: 6
|
155 |
+
other_count: 1
|
156 |
+
}
|
157 |
+
pusher_stats {
|
158 |
+
uploaded_bytes: 101169
|
159 |
+
total_bytes: 101169
|
160 |
+
}
|
161 |
+
|
162 |
+
2021-07-09 14:30:46,219 INFO MainThread:245719 [wandb_run.py:_show_summary():1870] rendering summary
|
163 |
+
2021-07-09 14:30:46,220 INFO MainThread:245719 [wandb_run.py:_show_history():1908] rendering history
|
164 |
+
2021-07-09 14:30:46,220 INFO MainThread:245719 [wandb_run.py:_show_files():1937] logging synced files
|
wandb/run-20210709_141445-2k8cnty2/run-2k8cnty2.wandb
CHANGED
Binary files a/wandb/run-20210709_141445-2k8cnty2/run-2k8cnty2.wandb and b/wandb/run-20210709_141445-2k8cnty2/run-2k8cnty2.wandb differ
|
|
wandb/run-20210709_144100-2k1kyrq2/files/conda-environment.yaml
ADDED
@@ -0,0 +1,187 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
name: jax
|
2 |
+
channels:
|
3 |
+
- pytorch
|
4 |
+
- conda-forge
|
5 |
+
- defaults
|
6 |
+
dependencies:
|
7 |
+
- _libgcc_mutex=0.1=main
|
8 |
+
- _openmp_mutex=4.5=1_gnu
|
9 |
+
- anyio=3.2.1=py38h578d9bd_0
|
10 |
+
- argon2-cffi=20.1.0=py38h497a2fe_2
|
11 |
+
- async_generator=1.10=py_0
|
12 |
+
- attrs=21.2.0=pyhd8ed1ab_0
|
13 |
+
- babel=2.9.1=pyh44b312d_0
|
14 |
+
- backcall=0.2.0=pyh9f0ad1d_0
|
15 |
+
- backports=1.0=py_2
|
16 |
+
- backports.functools_lru_cache=1.6.4=pyhd8ed1ab_0
|
17 |
+
- blas=1.0=mkl
|
18 |
+
- bleach=3.3.0=pyh44b312d_0
|
19 |
+
- brotlipy=0.7.0=py38h497a2fe_1001
|
20 |
+
- ca-certificates=2021.5.30=ha878542_0
|
21 |
+
- certifi=2021.5.30=py38h578d9bd_0
|
22 |
+
- cffi=1.14.5=py38ha65f79e_0
|
23 |
+
- chardet=4.0.0=py38h578d9bd_1
|
24 |
+
- cryptography=3.4.7=py38ha5dfef3_0
|
25 |
+
- cudatoolkit=10.2.89=hfd86e86_1
|
26 |
+
- debugpy=1.3.0=py38h709712a_0
|
27 |
+
- decorator=5.0.9=pyhd8ed1ab_0
|
28 |
+
- defusedxml=0.7.1=pyhd8ed1ab_0
|
29 |
+
- entrypoints=0.3=pyhd8ed1ab_1003
|
30 |
+
- idna=2.10=pyh9f0ad1d_0
|
31 |
+
- importlib-metadata=4.6.1=py38h578d9bd_0
|
32 |
+
- intel-openmp=2021.2.0=h06a4308_610
|
33 |
+
- ipykernel=6.0.1=py38hd0cf306_0
|
34 |
+
- ipython=7.25.0=py38hd0cf306_1
|
35 |
+
- ipython_genutils=0.2.0=py_1
|
36 |
+
- jedi=0.18.0=py38h578d9bd_2
|
37 |
+
- jinja2=3.0.1=pyhd8ed1ab_0
|
38 |
+
- json5=0.9.5=pyh9f0ad1d_0
|
39 |
+
- jsonschema=3.2.0=pyhd8ed1ab_3
|
40 |
+
- jupyter_client=6.1.12=pyhd8ed1ab_0
|
41 |
+
- jupyter_core=4.7.1=py38h578d9bd_0
|
42 |
+
- jupyter_server=1.9.0=pyhd8ed1ab_0
|
43 |
+
- jupyterlab=3.0.16=pyhd8ed1ab_0
|
44 |
+
- jupyterlab_pygments=0.1.2=pyh9f0ad1d_0
|
45 |
+
- jupyterlab_server=2.6.0=pyhd8ed1ab_0
|
46 |
+
- ld_impl_linux-64=2.35.1=h7274673_9
|
47 |
+
- libffi=3.3=he6710b0_2
|
48 |
+
- libgcc-ng=9.3.0=h5101ec6_17
|
49 |
+
- libgomp=9.3.0=h5101ec6_17
|
50 |
+
- libsodium=1.0.18=h36c2ea0_1
|
51 |
+
- libstdcxx-ng=9.3.0=hd4cf53a_17
|
52 |
+
- libuv=1.40.0=h7b6447c_0
|
53 |
+
- markupsafe=2.0.1=py38h497a2fe_0
|
54 |
+
- matplotlib-inline=0.1.2=pyhd8ed1ab_2
|
55 |
+
- mistune=0.8.4=py38h497a2fe_1004
|
56 |
+
- mkl=2021.2.0=h06a4308_296
|
57 |
+
- nbclassic=0.3.1=pyhd8ed1ab_1
|
58 |
+
- nbclient=0.5.3=pyhd8ed1ab_0
|
59 |
+
- nbconvert=6.1.0=py38h578d9bd_0
|
60 |
+
- nbformat=5.1.3=pyhd8ed1ab_0
|
61 |
+
- ncurses=6.2=he6710b0_1
|
62 |
+
- nest-asyncio=1.5.1=pyhd8ed1ab_0
|
63 |
+
- ninja=1.10.2=hff7bd54_1
|
64 |
+
- notebook=6.4.0=pyha770c72_0
|
65 |
+
- openssl=1.1.1k=h7f98852_0
|
66 |
+
- pandoc=2.14.0.3=h7f98852_0
|
67 |
+
- pandocfilters=1.4.2=py_1
|
68 |
+
- parso=0.8.2=pyhd8ed1ab_0
|
69 |
+
- pexpect=4.8.0=pyh9f0ad1d_2
|
70 |
+
- pickleshare=0.7.5=py_1003
|
71 |
+
- pip=21.1.3=py38h06a4308_0
|
72 |
+
- prometheus_client=0.11.0=pyhd8ed1ab_0
|
73 |
+
- prompt-toolkit=3.0.19=pyha770c72_0
|
74 |
+
- ptyprocess=0.7.0=pyhd3deb0d_0
|
75 |
+
- pycparser=2.20=pyh9f0ad1d_2
|
76 |
+
- pygments=2.9.0=pyhd8ed1ab_0
|
77 |
+
- pyopenssl=20.0.1=pyhd8ed1ab_0
|
78 |
+
- pyparsing=2.4.7=pyh9f0ad1d_0
|
79 |
+
- pyrsistent=0.17.3=py38h497a2fe_2
|
80 |
+
- pysocks=1.7.1=py38h578d9bd_3
|
81 |
+
- python=3.8.10=h12debd9_8
|
82 |
+
- python-dateutil=2.8.1=py_0
|
83 |
+
- python_abi=3.8=2_cp38
|
84 |
+
- pytorch=1.9.0=py3.8_cuda10.2_cudnn7.6.5_0
|
85 |
+
- pytz=2021.1=pyhd8ed1ab_0
|
86 |
+
- pyzmq=22.1.0=py38h2035c66_0
|
87 |
+
- readline=8.1=h27cfd23_0
|
88 |
+
- requests=2.25.1=pyhd3deb0d_0
|
89 |
+
- requests-unixsocket=0.2.0=py_0
|
90 |
+
- send2trash=1.7.1=pyhd8ed1ab_0
|
91 |
+
- setuptools=52.0.0=py38h06a4308_0
|
92 |
+
- sniffio=1.2.0=py38h578d9bd_1
|
93 |
+
- sqlite=3.36.0=hc218d9a_0
|
94 |
+
- terminado=0.10.1=py38h578d9bd_0
|
95 |
+
- testpath=0.5.0=pyhd8ed1ab_0
|
96 |
+
- tk=8.6.10=hbc83047_0
|
97 |
+
- tornado=6.1=py38h497a2fe_1
|
98 |
+
- traitlets=5.0.5=py_0
|
99 |
+
- typing_extensions=3.10.0.0=pyha770c72_0
|
100 |
+
- urllib3=1.26.6=pyhd8ed1ab_0
|
101 |
+
- wcwidth=0.2.5=pyh9f0ad1d_2
|
102 |
+
- webencodings=0.5.1=py_1
|
103 |
+
- websocket-client=0.57.0=py38h578d9bd_4
|
104 |
+
- wheel=0.36.2=pyhd3eb1b0_0
|
105 |
+
- xz=5.2.5=h7b6447c_0
|
106 |
+
- zeromq=4.3.4=h9c3ff4c_0
|
107 |
+
- zipp=3.5.0=pyhd8ed1ab_0
|
108 |
+
- zlib=1.2.11=h7b6447c_3
|
109 |
+
- pip:
|
110 |
+
- absl-py==0.13.0
|
111 |
+
- aiohttp==3.7.4.post0
|
112 |
+
- astunparse==1.6.3
|
113 |
+
- async-timeout==3.0.1
|
114 |
+
- cachetools==4.2.2
|
115 |
+
- chex==0.0.8
|
116 |
+
- click==8.0.1
|
117 |
+
- configparser==5.0.2
|
118 |
+
- cycler==0.10.0
|
119 |
+
- dill==0.3.4
|
120 |
+
- dm-tree==0.1.6
|
121 |
+
- docker-pycreds==0.4.0
|
122 |
+
- filelock==3.0.12
|
123 |
+
- flatbuffers==1.12
|
124 |
+
- flax==0.3.4
|
125 |
+
- fsspec==2021.6.1
|
126 |
+
- gast==0.4.0
|
127 |
+
- gitdb==4.0.7
|
128 |
+
- gitpython==3.1.18
|
129 |
+
- google-auth==1.32.1
|
130 |
+
- google-auth-oauthlib==0.4.4
|
131 |
+
- google-pasta==0.2.0
|
132 |
+
- grpcio==1.34.1
|
133 |
+
- h5py==3.1.0
|
134 |
+
- huggingface-hub==0.0.12
|
135 |
+
- jax==0.2.16
|
136 |
+
- jaxlib==0.1.68
|
137 |
+
- joblib==1.0.1
|
138 |
+
- keras-nightly==2.5.0.dev2021032900
|
139 |
+
- keras-preprocessing==1.1.2
|
140 |
+
- kiwisolver==1.3.1
|
141 |
+
- libtpu-nightly==0.1.dev20210615
|
142 |
+
- markdown==3.3.4
|
143 |
+
- matplotlib==3.4.2
|
144 |
+
- msgpack==1.0.2
|
145 |
+
- multidict==5.1.0
|
146 |
+
- multiprocess==0.70.12.2
|
147 |
+
- numpy==1.19.5
|
148 |
+
- oauthlib==3.1.1
|
149 |
+
- opt-einsum==3.3.0
|
150 |
+
- optax==0.0.9
|
151 |
+
- packaging==20.9
|
152 |
+
- pandas==1.2.5
|
153 |
+
- pathtools==0.1.2
|
154 |
+
- pillow==8.3.0
|
155 |
+
- promise==2.3
|
156 |
+
- protobuf==3.17.3
|
157 |
+
- psutil==5.8.0
|
158 |
+
- pyarrow==4.0.1
|
159 |
+
- pyasn1==0.4.8
|
160 |
+
- pyasn1-modules==0.2.8
|
161 |
+
- pyyaml==5.4.1
|
162 |
+
- regex==2021.7.1
|
163 |
+
- requests-oauthlib==1.3.0
|
164 |
+
- rsa==4.7.2
|
165 |
+
- sacremoses==0.0.45
|
166 |
+
- scipy==1.7.0
|
167 |
+
- sentry-sdk==1.1.0
|
168 |
+
- shortuuid==1.0.1
|
169 |
+
- six==1.15.0
|
170 |
+
- smmap==4.0.0
|
171 |
+
- subprocess32==3.5.4
|
172 |
+
- tensorboard==2.5.0
|
173 |
+
- tensorboard-data-server==0.6.1
|
174 |
+
- tensorboard-plugin-wit==1.8.0
|
175 |
+
- tensorflow==2.5.0
|
176 |
+
- tensorflow-estimator==2.5.0
|
177 |
+
- termcolor==1.1.0
|
178 |
+
- tokenizers==0.10.3
|
179 |
+
- toolz==0.11.1
|
180 |
+
- tqdm==4.61.1
|
181 |
+
- typing-extensions==3.7.4.3
|
182 |
+
- wandb==0.10.33
|
183 |
+
- werkzeug==2.0.1
|
184 |
+
- wrapt==1.12.1
|
185 |
+
- xxhash==2.0.2
|
186 |
+
- yarl==1.6.3
|
187 |
+
prefix: /home/cahya/miniconda3/envs/jax
|
wandb/run-20210709_144100-2k1kyrq2/files/config.yaml
ADDED
@@ -0,0 +1,305 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
wandb_version: 1
|
2 |
+
|
3 |
+
__cached__setup_devices:
|
4 |
+
desc: null
|
5 |
+
value: cpu
|
6 |
+
_n_gpu:
|
7 |
+
desc: null
|
8 |
+
value: 0
|
9 |
+
_wandb:
|
10 |
+
desc: null
|
11 |
+
value:
|
12 |
+
cli_version: 0.10.33
|
13 |
+
framework: huggingface
|
14 |
+
huggingface_version: 4.9.0.dev0
|
15 |
+
is_jupyter_run: false
|
16 |
+
is_kaggle_kernel: false
|
17 |
+
python_version: 3.8.10
|
18 |
+
t:
|
19 |
+
1:
|
20 |
+
- 1
|
21 |
+
- 3
|
22 |
+
- 11
|
23 |
+
4: 3.8.10
|
24 |
+
5: 0.10.33
|
25 |
+
6: 4.9.0.dev0
|
26 |
+
8:
|
27 |
+
- 5
|
28 |
+
adafactor:
|
29 |
+
desc: null
|
30 |
+
value: false
|
31 |
+
adam_beta1:
|
32 |
+
desc: null
|
33 |
+
value: 0.9
|
34 |
+
adam_beta2:
|
35 |
+
desc: null
|
36 |
+
value: 0.98
|
37 |
+
adam_epsilon:
|
38 |
+
desc: null
|
39 |
+
value: 1.0e-08
|
40 |
+
block_size:
|
41 |
+
desc: null
|
42 |
+
value: 512
|
43 |
+
cache_dir:
|
44 |
+
desc: null
|
45 |
+
value: null
|
46 |
+
config_name:
|
47 |
+
desc: null
|
48 |
+
value: /home/cahya/Work/flax-community/gpt2-medium-indonesian
|
49 |
+
dataloader_drop_last:
|
50 |
+
desc: null
|
51 |
+
value: false
|
52 |
+
dataloader_num_workers:
|
53 |
+
desc: null
|
54 |
+
value: 64
|
55 |
+
dataloader_pin_memory:
|
56 |
+
desc: null
|
57 |
+
value: true
|
58 |
+
dataset_config_name:
|
59 |
+
desc: null
|
60 |
+
value: unshuffled_deduplicated_id
|
61 |
+
dataset_name:
|
62 |
+
desc: null
|
63 |
+
value: oscar
|
64 |
+
ddp_find_unused_parameters:
|
65 |
+
desc: null
|
66 |
+
value: null
|
67 |
+
debug:
|
68 |
+
desc: null
|
69 |
+
value: []
|
70 |
+
deepspeed:
|
71 |
+
desc: null
|
72 |
+
value: null
|
73 |
+
disable_tqdm:
|
74 |
+
desc: null
|
75 |
+
value: false
|
76 |
+
do_eval:
|
77 |
+
desc: null
|
78 |
+
value: true
|
79 |
+
do_predict:
|
80 |
+
desc: null
|
81 |
+
value: false
|
82 |
+
do_train:
|
83 |
+
desc: null
|
84 |
+
value: true
|
85 |
+
dtype:
|
86 |
+
desc: null
|
87 |
+
value: float32
|
88 |
+
eval_accumulation_steps:
|
89 |
+
desc: null
|
90 |
+
value: null
|
91 |
+
eval_steps:
|
92 |
+
desc: null
|
93 |
+
value: 5000
|
94 |
+
evaluation_strategy:
|
95 |
+
desc: null
|
96 |
+
value: IntervalStrategy.NO
|
97 |
+
fp16:
|
98 |
+
desc: null
|
99 |
+
value: false
|
100 |
+
fp16_backend:
|
101 |
+
desc: null
|
102 |
+
value: auto
|
103 |
+
fp16_full_eval:
|
104 |
+
desc: null
|
105 |
+
value: false
|
106 |
+
fp16_opt_level:
|
107 |
+
desc: null
|
108 |
+
value: O1
|
109 |
+
gradient_accumulation_steps:
|
110 |
+
desc: null
|
111 |
+
value: 1
|
112 |
+
greater_is_better:
|
113 |
+
desc: null
|
114 |
+
value: null
|
115 |
+
group_by_length:
|
116 |
+
desc: null
|
117 |
+
value: false
|
118 |
+
ignore_data_skip:
|
119 |
+
desc: null
|
120 |
+
value: false
|
121 |
+
label_names:
|
122 |
+
desc: null
|
123 |
+
value: null
|
124 |
+
label_smoothing_factor:
|
125 |
+
desc: null
|
126 |
+
value: 0.0
|
127 |
+
learning_rate:
|
128 |
+
desc: null
|
129 |
+
value: 0.0024
|
130 |
+
length_column_name:
|
131 |
+
desc: null
|
132 |
+
value: length
|
133 |
+
load_best_model_at_end:
|
134 |
+
desc: null
|
135 |
+
value: false
|
136 |
+
local_rank:
|
137 |
+
desc: null
|
138 |
+
value: -1
|
139 |
+
log_level:
|
140 |
+
desc: null
|
141 |
+
value: -1
|
142 |
+
log_level_replica:
|
143 |
+
desc: null
|
144 |
+
value: -1
|
145 |
+
log_on_each_node:
|
146 |
+
desc: null
|
147 |
+
value: true
|
148 |
+
logging_dir:
|
149 |
+
desc: null
|
150 |
+
value: /home/cahya/Work/flax-community/gpt2-medium-indonesian/runs/Jul09_14-41-04_t1v-n-528d9406-w-0
|
151 |
+
logging_first_step:
|
152 |
+
desc: null
|
153 |
+
value: false
|
154 |
+
logging_steps:
|
155 |
+
desc: null
|
156 |
+
value: 5000
|
157 |
+
logging_strategy:
|
158 |
+
desc: null
|
159 |
+
value: IntervalStrategy.STEPS
|
160 |
+
lr_scheduler_type:
|
161 |
+
desc: null
|
162 |
+
value: SchedulerType.LINEAR
|
163 |
+
max_eval_samples:
|
164 |
+
desc: null
|
165 |
+
value: null
|
166 |
+
max_grad_norm:
|
167 |
+
desc: null
|
168 |
+
value: 1.0
|
169 |
+
max_steps:
|
170 |
+
desc: null
|
171 |
+
value: -1
|
172 |
+
max_train_samples:
|
173 |
+
desc: null
|
174 |
+
value: null
|
175 |
+
metric_for_best_model:
|
176 |
+
desc: null
|
177 |
+
value: null
|
178 |
+
model_name_or_path:
|
179 |
+
desc: null
|
180 |
+
value: null
|
181 |
+
model_type:
|
182 |
+
desc: null
|
183 |
+
value: gpt2
|
184 |
+
mp_parameters:
|
185 |
+
desc: null
|
186 |
+
value: ''
|
187 |
+
no_cuda:
|
188 |
+
desc: null
|
189 |
+
value: false
|
190 |
+
num_train_epochs:
|
191 |
+
desc: null
|
192 |
+
value: 20.0
|
193 |
+
output_dir:
|
194 |
+
desc: null
|
195 |
+
value: /home/cahya/Work/flax-community/gpt2-medium-indonesian
|
196 |
+
overwrite_cache:
|
197 |
+
desc: null
|
198 |
+
value: false
|
199 |
+
overwrite_output_dir:
|
200 |
+
desc: null
|
201 |
+
value: true
|
202 |
+
past_index:
|
203 |
+
desc: null
|
204 |
+
value: -1
|
205 |
+
per_device_eval_batch_size:
|
206 |
+
desc: null
|
207 |
+
value: 24
|
208 |
+
per_device_train_batch_size:
|
209 |
+
desc: null
|
210 |
+
value: 24
|
211 |
+
per_gpu_eval_batch_size:
|
212 |
+
desc: null
|
213 |
+
value: null
|
214 |
+
per_gpu_train_batch_size:
|
215 |
+
desc: null
|
216 |
+
value: null
|
217 |
+
prediction_loss_only:
|
218 |
+
desc: null
|
219 |
+
value: false
|
220 |
+
preprocessing_num_workers:
|
221 |
+
desc: null
|
222 |
+
value: 64
|
223 |
+
push_to_hub:
|
224 |
+
desc: null
|
225 |
+
value: true
|
226 |
+
push_to_hub_model_id:
|
227 |
+
desc: null
|
228 |
+
value: gpt2-medium-indonesian
|
229 |
+
push_to_hub_organization:
|
230 |
+
desc: null
|
231 |
+
value: null
|
232 |
+
push_to_hub_token:
|
233 |
+
desc: null
|
234 |
+
value: null
|
235 |
+
remove_unused_columns:
|
236 |
+
desc: null
|
237 |
+
value: true
|
238 |
+
report_to:
|
239 |
+
desc: null
|
240 |
+
value:
|
241 |
+
- tensorboard
|
242 |
+
- wandb
|
243 |
+
resume_from_checkpoint:
|
244 |
+
desc: null
|
245 |
+
value: null
|
246 |
+
run_name:
|
247 |
+
desc: null
|
248 |
+
value: /home/cahya/Work/flax-community/gpt2-medium-indonesian
|
249 |
+
save_on_each_node:
|
250 |
+
desc: null
|
251 |
+
value: false
|
252 |
+
save_steps:
|
253 |
+
desc: null
|
254 |
+
value: 5000
|
255 |
+
save_strategy:
|
256 |
+
desc: null
|
257 |
+
value: IntervalStrategy.STEPS
|
258 |
+
save_total_limit:
|
259 |
+
desc: null
|
260 |
+
value: null
|
261 |
+
seed:
|
262 |
+
desc: null
|
263 |
+
value: 42
|
264 |
+
sharded_ddp:
|
265 |
+
desc: null
|
266 |
+
value: []
|
267 |
+
skip_memory_metrics:
|
268 |
+
desc: null
|
269 |
+
value: true
|
270 |
+
test_log:
|
271 |
+
desc: null
|
272 |
+
value: 12345
|
273 |
+
tokenizer_name:
|
274 |
+
desc: null
|
275 |
+
value: /home/cahya/Work/flax-community/gpt2-medium-indonesian
|
276 |
+
tpu_metrics_debug:
|
277 |
+
desc: null
|
278 |
+
value: false
|
279 |
+
tpu_num_cores:
|
280 |
+
desc: null
|
281 |
+
value: null
|
282 |
+
train_file:
|
283 |
+
desc: null
|
284 |
+
value: null
|
285 |
+
use_fast_tokenizer:
|
286 |
+
desc: null
|
287 |
+
value: true
|
288 |
+
use_legacy_prediction_loop:
|
289 |
+
desc: null
|
290 |
+
value: false
|
291 |
+
validation_file:
|
292 |
+
desc: null
|
293 |
+
value: null
|
294 |
+
validation_split_percentage:
|
295 |
+
desc: null
|
296 |
+
value: 2
|
297 |
+
warmup_ratio:
|
298 |
+
desc: null
|
299 |
+
value: 0.0
|
300 |
+
warmup_steps:
|
301 |
+
desc: null
|
302 |
+
value: 1000
|
303 |
+
weight_decay:
|
304 |
+
desc: null
|
305 |
+
value: 0.01
|
wandb/run-20210709_144100-2k1kyrq2/files/events.out.tfevents.1625843003.t1v-n-528d9406-w-0.250031.3.v2
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
/home/cahya/Work/flax-community/gpt2-medium-indonesian/events.out.tfevents.1625843003.t1v-n-528d9406-w-0.250031.3.v2
|
wandb/run-20210709_144100-2k1kyrq2/files/output.log
ADDED
The diff for this file is too large to render.
See raw diff
|
|
wandb/run-20210709_144100-2k1kyrq2/files/requirements.txt
ADDED
@@ -0,0 +1,153 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
absl-py==0.13.0
|
2 |
+
aiohttp==3.7.4.post0
|
3 |
+
anyio==3.2.1
|
4 |
+
argon2-cffi==20.1.0
|
5 |
+
astunparse==1.6.3
|
6 |
+
async-generator==1.10
|
7 |
+
async-timeout==3.0.1
|
8 |
+
attrs==21.2.0
|
9 |
+
babel==2.9.1
|
10 |
+
backcall==0.2.0
|
11 |
+
backports.functools-lru-cache==1.6.4
|
12 |
+
bleach==3.3.0
|
13 |
+
brotlipy==0.7.0
|
14 |
+
cachetools==4.2.2
|
15 |
+
certifi==2021.5.30
|
16 |
+
cffi==1.14.5
|
17 |
+
chardet==4.0.0
|
18 |
+
chex==0.0.8
|
19 |
+
click==8.0.1
|
20 |
+
configparser==5.0.2
|
21 |
+
cryptography==3.4.7
|
22 |
+
cycler==0.10.0
|
23 |
+
datasets==1.8.1.dev0
|
24 |
+
debugpy==1.3.0
|
25 |
+
decorator==5.0.9
|
26 |
+
defusedxml==0.7.1
|
27 |
+
dill==0.3.4
|
28 |
+
dm-tree==0.1.6
|
29 |
+
docker-pycreds==0.4.0
|
30 |
+
entrypoints==0.3
|
31 |
+
filelock==3.0.12
|
32 |
+
flatbuffers==1.12
|
33 |
+
flax==0.3.4
|
34 |
+
fsspec==2021.6.1
|
35 |
+
gast==0.4.0
|
36 |
+
gitdb==4.0.7
|
37 |
+
gitpython==3.1.18
|
38 |
+
google-auth-oauthlib==0.4.4
|
39 |
+
google-auth==1.32.1
|
40 |
+
google-pasta==0.2.0
|
41 |
+
grpcio==1.34.1
|
42 |
+
h5py==3.1.0
|
43 |
+
huggingface-hub==0.0.12
|
44 |
+
idna==2.10
|
45 |
+
importlib-metadata==4.6.1
|
46 |
+
ipykernel==6.0.1
|
47 |
+
ipython-genutils==0.2.0
|
48 |
+
ipython==7.25.0
|
49 |
+
jax==0.2.16
|
50 |
+
jaxlib==0.1.68
|
51 |
+
jedi==0.18.0
|
52 |
+
jinja2==3.0.1
|
53 |
+
joblib==1.0.1
|
54 |
+
json5==0.9.5
|
55 |
+
jsonschema==3.2.0
|
56 |
+
jupyter-client==6.1.12
|
57 |
+
jupyter-core==4.7.1
|
58 |
+
jupyter-server==1.9.0
|
59 |
+
jupyterlab-pygments==0.1.2
|
60 |
+
jupyterlab-server==2.6.0
|
61 |
+
jupyterlab==3.0.16
|
62 |
+
keras-nightly==2.5.0.dev2021032900
|
63 |
+
keras-preprocessing==1.1.2
|
64 |
+
kiwisolver==1.3.1
|
65 |
+
libtpu-nightly==0.1.dev20210615
|
66 |
+
markdown==3.3.4
|
67 |
+
markupsafe==2.0.1
|
68 |
+
matplotlib-inline==0.1.2
|
69 |
+
matplotlib==3.4.2
|
70 |
+
mistune==0.8.4
|
71 |
+
msgpack==1.0.2
|
72 |
+
multidict==5.1.0
|
73 |
+
multiprocess==0.70.12.2
|
74 |
+
nbclassic==0.3.1
|
75 |
+
nbclient==0.5.3
|
76 |
+
nbconvert==6.1.0
|
77 |
+
nbformat==5.1.3
|
78 |
+
nest-asyncio==1.5.1
|
79 |
+
notebook==6.4.0
|
80 |
+
numpy==1.19.5
|
81 |
+
oauthlib==3.1.1
|
82 |
+
opt-einsum==3.3.0
|
83 |
+
optax==0.0.9
|
84 |
+
packaging==21.0
|
85 |
+
pandas==1.2.5
|
86 |
+
pandocfilters==1.4.2
|
87 |
+
parso==0.8.2
|
88 |
+
pathtools==0.1.2
|
89 |
+
pexpect==4.8.0
|
90 |
+
pickleshare==0.7.5
|
91 |
+
pillow==8.3.0
|
92 |
+
pip==21.1.3
|
93 |
+
prometheus-client==0.11.0
|
94 |
+
promise==2.3
|
95 |
+
prompt-toolkit==3.0.19
|
96 |
+
protobuf==3.17.3
|
97 |
+
psutil==5.8.0
|
98 |
+
ptyprocess==0.7.0
|
99 |
+
pyarrow==4.0.1
|
100 |
+
pyasn1-modules==0.2.8
|
101 |
+
pyasn1==0.4.8
|
102 |
+
pycparser==2.20
|
103 |
+
pygments==2.9.0
|
104 |
+
pyopenssl==20.0.1
|
105 |
+
pyparsing==2.4.7
|
106 |
+
pyrsistent==0.17.3
|
107 |
+
pysocks==1.7.1
|
108 |
+
python-dateutil==2.8.1
|
109 |
+
pytz==2021.1
|
110 |
+
pyyaml==5.4.1
|
111 |
+
pyzmq==22.1.0
|
112 |
+
regex==2021.7.1
|
113 |
+
requests-oauthlib==1.3.0
|
114 |
+
requests-unixsocket==0.2.0
|
115 |
+
requests==2.25.1
|
116 |
+
rsa==4.7.2
|
117 |
+
sacremoses==0.0.45
|
118 |
+
scipy==1.7.0
|
119 |
+
send2trash==1.7.1
|
120 |
+
sentry-sdk==1.1.0
|
121 |
+
setuptools==52.0.0.post20210125
|
122 |
+
shortuuid==1.0.1
|
123 |
+
six==1.16.0
|
124 |
+
smmap==4.0.0
|
125 |
+
sniffio==1.2.0
|
126 |
+
subprocess32==3.5.4
|
127 |
+
tensorboard-data-server==0.6.1
|
128 |
+
tensorboard-plugin-wit==1.8.0
|
129 |
+
tensorboard==2.5.0
|
130 |
+
tensorflow-estimator==2.5.0
|
131 |
+
tensorflow==2.5.0
|
132 |
+
termcolor==1.1.0
|
133 |
+
terminado==0.10.1
|
134 |
+
testpath==0.5.0
|
135 |
+
tokenizers==0.10.3
|
136 |
+
toolz==0.11.1
|
137 |
+
torch==1.9.0
|
138 |
+
tornado==6.1
|
139 |
+
tqdm==4.61.1
|
140 |
+
traitlets==5.0.5
|
141 |
+
transformers==4.9.0.dev0
|
142 |
+
typing-extensions==3.10.0.0
|
143 |
+
urllib3==1.26.6
|
144 |
+
wandb==0.10.33
|
145 |
+
wcwidth==0.2.5
|
146 |
+
webencodings==0.5.1
|
147 |
+
websocket-client==0.57.0
|
148 |
+
werkzeug==2.0.1
|
149 |
+
wheel==0.36.2
|
150 |
+
wrapt==1.12.1
|
151 |
+
xxhash==2.0.2
|
152 |
+
yarl==1.6.3
|
153 |
+
zipp==3.5.0
|
wandb/run-20210709_144100-2k1kyrq2/files/wandb-metadata.json
ADDED
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"os": "Linux-5.4.0-1043-gcp-x86_64-with-glibc2.17",
|
3 |
+
"python": "3.8.10",
|
4 |
+
"heartbeatAt": "2021-07-09T14:41:02.325218",
|
5 |
+
"startedAt": "2021-07-09T14:41:00.270917",
|
6 |
+
"docker": null,
|
7 |
+
"cpu_count": 96,
|
8 |
+
"cuda": null,
|
9 |
+
"args": [
|
10 |
+
"--output_dir=/home/cahya/Work/flax-community/gpt2-medium-indonesian",
|
11 |
+
"--model_type=gpt2",
|
12 |
+
"--config_name=/home/cahya/Work/flax-community/gpt2-medium-indonesian",
|
13 |
+
"--tokenizer_name=/home/cahya/Work/flax-community/gpt2-medium-indonesian",
|
14 |
+
"--dataset_name=oscar",
|
15 |
+
"--dataset_config_name=unshuffled_deduplicated_id",
|
16 |
+
"--do_train",
|
17 |
+
"--do_eval",
|
18 |
+
"--block_size=512",
|
19 |
+
"--per_device_train_batch_size=24",
|
20 |
+
"--per_device_eval_batch_size=24",
|
21 |
+
"--learning_rate=0.0024",
|
22 |
+
"--warmup_steps=1000",
|
23 |
+
"--adam_beta1=0.9",
|
24 |
+
"--adam_beta2=0.98",
|
25 |
+
"--weight_decay=0.01",
|
26 |
+
"--overwrite_output_dir",
|
27 |
+
"--num_train_epochs=20",
|
28 |
+
"--dataloader_num_workers=64",
|
29 |
+
"--preprocessing_num_workers=64",
|
30 |
+
"--logging_steps=5000",
|
31 |
+
"--save_steps=5000",
|
32 |
+
"--eval_steps=5000",
|
33 |
+
"--validation_split_percentage=2",
|
34 |
+
"--push_to_hub"
|
35 |
+
],
|
36 |
+
"state": "running",
|
37 |
+
"program": "./run_clm_flax.py",
|
38 |
+
"codePath": "run_clm_flax.py",
|
39 |
+
"git": {
|
40 |
+
"remote": "https://huggingface.co/flax-community/gpt2-medium-indonesian",
|
41 |
+
"commit": "9b9473462e797993d7ca4cfb92daa71c0bc81e9d"
|
42 |
+
},
|
43 |
+
"email": "[email protected]",
|
44 |
+
"root": "/home/cahya/Work/flax-community/gpt2-medium-indonesian",
|
45 |
+
"host": "t1v-n-528d9406-w-0",
|
46 |
+
"username": "cahya",
|
47 |
+
"executable": "/home/cahya/miniconda3/envs/jax/bin/python"
|
48 |
+
}
|
wandb/run-20210709_144100-2k1kyrq2/files/wandb-summary.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"global_step": 5000, "_timestamp": 1625848638.071834, "train_time": 5622.2197265625, "train_learning_rate": 0.00238410709425807, "_step": 9997, "train_loss": 3.5673484802246094}
|
wandb/run-20210709_144100-2k1kyrq2/logs/debug-internal.log
ADDED
The diff for this file is too large to render.
See raw diff
|
|
wandb/run-20210709_144100-2k1kyrq2/logs/debug.log
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_setup.py:_flush():69] Unhandled environment var: WANDB_LOG_MODEL
|
2 |
+
2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_setup.py:_flush():69] setting env: {'project': 'hf-flax-gpt2-indonesian', 'entity': 'wandb'}
|
3 |
+
2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_setup.py:_flush():69] setting login settings: {}
|
4 |
+
2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_init.py:_log_setup():337] Logging user logs to /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_144100-2k1kyrq2/logs/debug.log
|
5 |
+
2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_init.py:_log_setup():338] Logging internal logs to /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_144100-2k1kyrq2/logs/debug-internal.log
|
6 |
+
2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_init.py:init():370] calling init triggers
|
7 |
+
2021-07-09 14:41:00,273 INFO MainThread:250031 [wandb_init.py:init():375] wandb.init called with sweep_config: {}
|
8 |
+
config: {}
|
9 |
+
2021-07-09 14:41:00,273 INFO MainThread:250031 [wandb_init.py:init():419] starting backend
|
10 |
+
2021-07-09 14:41:00,273 INFO MainThread:250031 [backend.py:_multiprocessing_setup():70] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
|
11 |
+
2021-07-09 14:41:00,314 INFO MainThread:250031 [backend.py:ensure_launched():135] starting backend process...
|
12 |
+
2021-07-09 14:41:00,353 INFO MainThread:250031 [backend.py:ensure_launched():139] started backend process with pid: 251111
|
13 |
+
2021-07-09 14:41:00,355 INFO MainThread:250031 [wandb_init.py:init():424] backend started and connected
|
14 |
+
2021-07-09 14:41:00,357 INFO MainThread:250031 [wandb_init.py:init():472] updated telemetry
|
15 |
+
2021-07-09 14:41:00,358 INFO MainThread:250031 [wandb_init.py:init():491] communicating current version
|
16 |
+
2021-07-09 14:41:01,006 INFO MainThread:250031 [wandb_init.py:init():496] got version response
|
17 |
+
2021-07-09 14:41:01,006 INFO MainThread:250031 [wandb_init.py:init():504] communicating run to backend with 30 second timeout
|
18 |
+
2021-07-09 14:41:01,184 INFO MainThread:250031 [wandb_init.py:init():529] starting run threads in backend
|
19 |
+
2021-07-09 14:41:04,780 INFO MainThread:250031 [wandb_run.py:_console_start():1623] atexit reg
|
20 |
+
2021-07-09 14:41:04,781 INFO MainThread:250031 [wandb_run.py:_redirect():1497] redirect: SettingsConsole.REDIRECT
|
21 |
+
2021-07-09 14:41:04,782 INFO MainThread:250031 [wandb_run.py:_redirect():1502] Redirecting console.
|
22 |
+
2021-07-09 14:41:04,783 INFO MainThread:250031 [wandb_run.py:_redirect():1558] Redirects installed.
|
23 |
+
2021-07-09 14:41:04,784 INFO MainThread:250031 [wandb_init.py:init():554] run started, returning control to user process
|
24 |
+
2021-07-09 14:41:04,793 INFO MainThread:250031 [wandb_run.py:_config_callback():872] config_cb None None {'output_dir': '/home/cahya/Work/flax-community/gpt2-medium-indonesian', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'IntervalStrategy.NO', 'prediction_loss_only': False, 'per_device_train_batch_size': 24, 'per_device_eval_batch_size': 24, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'learning_rate': 0.0024, 'weight_decay': 0.01, 'adam_beta1': 0.9, 'adam_beta2': 0.98, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 20.0, 'max_steps': -1, 'lr_scheduler_type': 'SchedulerType.LINEAR', 'warmup_ratio': 0.0, 'warmup_steps': 1000, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': '/home/cahya/Work/flax-community/gpt2-medium-indonesian/runs/Jul09_14-41-04_t1v-n-528d9406-w-0', 'logging_strategy': 'IntervalStrategy.STEPS', 'logging_first_step': False, 'logging_steps': 5000, 'save_strategy': 'IntervalStrategy.STEPS', 'save_steps': 5000, 'save_total_limit': None, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'fp16': False, 'fp16_opt_level': 'O1', 'fp16_backend': 'auto', 'fp16_full_eval': False, 'local_rank': -1, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': 5000, 'dataloader_num_workers': 64, 'past_index': -1, 'run_name': '/home/cahya/Work/flax-community/gpt2-medium-indonesian', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'sharded_ddp': [], 'deepspeed': None, 'label_smoothing_factor': 0.0, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': None, 'push_to_hub_model_id': 'gpt2-medium-indonesian', 'push_to_hub_organization': None, 'push_to_hub_token': None, 'mp_parameters': '', '_n_gpu': 0, '__cached__setup_devices': 'cpu'}
|
25 |
+
2021-07-09 14:41:04,794 INFO MainThread:250031 [wandb_run.py:_config_callback():872] config_cb None None {'model_name_or_path': None, 'model_type': 'gpt2', 'config_name': '/home/cahya/Work/flax-community/gpt2-medium-indonesian', 'tokenizer_name': '/home/cahya/Work/flax-community/gpt2-medium-indonesian', 'cache_dir': None, 'use_fast_tokenizer': True, 'dtype': 'float32'}
|
26 |
+
2021-07-09 14:41:04,794 INFO MainThread:250031 [wandb_run.py:_config_callback():872] config_cb None None {'dataset_name': 'oscar', 'dataset_config_name': 'unshuffled_deduplicated_id', 'train_file': None, 'validation_file': None, 'max_train_samples': None, 'max_eval_samples': None, 'overwrite_cache': False, 'validation_split_percentage': 2, 'block_size': 512, 'preprocessing_num_workers': 64}
|
27 |
+
2021-07-09 14:41:04,795 INFO MainThread:250031 [wandb_config.py:__setitem__():141] config set test_log = 12345 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f3836ca5a90>>
|
28 |
+
2021-07-09 14:41:04,795 INFO MainThread:250031 [wandb_run.py:_config_callback():872] config_cb test_log 12345 None
|
29 |
+
2021-07-09 15:03:23,473 INFO MainThread:250031 [wandb_run.py:_tensorboard_callback():943] tensorboard callback: /home/cahya/Work/flax-community/gpt2-medium-indonesian, None
|
wandb/run-20210709_144100-2k1kyrq2/run-2k1kyrq2.wandb
ADDED
Binary file (1.4 MB). View file
|
|