cahya commited on
Commit
735daf5
1 Parent(s): 9b94734

Saving weights and logs of step 5000

Browse files
events.out.tfevents.1625843003.t1v-n-528d9406-w-0.250031.3.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65f1a7d1164ca3b62fcc3dea900488379e35e8dbc651d2d586a093e695813bb7
3
+ size 735138
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68d1eca2a3ae4fc5ba1ba43e64ef83cd58cf8add1c0aee8478bf5651b0bcd130
3
  size 1419302302
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c82df389e510b831d9a5c33f348a258ef105f78170ccc3efd78ab838d40a038b
3
  size 1419302302
run_pretraining.sh CHANGED
@@ -20,8 +20,8 @@ export WANDB_LOG_MODEL="true"
20
  --num_train_epochs="20" \
21
  --dataloader_num_workers="64" \
22
  --preprocessing_num_workers="64" \
23
- --save_steps="10" \
24
- --eval_steps="10" \
25
- --max_train_samples="10000" \
26
- --max_eval_samples="1000" \
27
  --push_to_hub
 
20
  --num_train_epochs="20" \
21
  --dataloader_num_workers="64" \
22
  --preprocessing_num_workers="64" \
23
+ --logging_steps="5000" \
24
+ --save_steps="5000" \
25
+ --eval_steps="5000" \
26
+ --validation_split_percentage="2" \
27
  --push_to_hub
wandb/debug-internal.log CHANGED
@@ -1 +1 @@
1
- run-20210709_141445-2k8cnty2/logs/debug-internal.log
 
1
+ run-20210709_144100-2k1kyrq2/logs/debug-internal.log
wandb/debug.log CHANGED
@@ -1 +1 @@
1
- run-20210709_141445-2k8cnty2/logs/debug.log
 
1
+ run-20210709_144100-2k1kyrq2/logs/debug.log
wandb/latest-run CHANGED
@@ -1 +1 @@
1
- run-20210709_141445-2k8cnty2
 
1
+ run-20210709_144100-2k1kyrq2
wandb/run-20210709_141445-2k8cnty2/files/config.yaml CHANGED
@@ -20,6 +20,10 @@ _wandb:
20
  - 1
21
  - 3
22
  - 11
 
 
 
 
23
  4: 3.8.10
24
  5: 0.10.33
25
  6: 4.9.0.dev0
 
20
  - 1
21
  - 3
22
  - 11
23
+ 2:
24
+ - 1
25
+ - 3
26
+ - 11
27
  4: 3.8.10
28
  5: 0.10.33
29
  6: 4.9.0.dev0
wandb/run-20210709_141445-2k8cnty2/files/output.log CHANGED
@@ -528,3 +528,17 @@ Training...: 92%|████████████████████
528
  Evaluating...: 0%| | 0/5 [00:00<?, ?it/s]
529
 
530
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
528
  Evaluating...: 0%| | 0/5 [00:00<?, ?it/s]
529
 
530
 
531
+ Model weights saved in /home/cahya/Work/flax-community/gpt2-medium-indonesian/flax_model.msgpack██████████████████████████████████████████████████████████████████████████████████████████████████████ | 48/52 [05:47<00:06, 1.74s/it]
532
+ Model pushed to the hub in this commit: https://huggingface.co/flax-community/gpt2-medium-indonesian/commit/9b9473462e797993d7ca4cfb92daa71c0bc81e9d
533
+ Step... (100 | Eval Loss: 7.69423770904541 | Eval Perplexity: 2195.65944089946): 10%|████████████▌ | 2/20 [14:54<2:13:01, 443.41s/it]
534
+
535
+ Training...: 12%|██████████████████████▌ | 6/52 [00:01<00:10, 4.36it/s]
536
+ File "./run_clm_flax.py", line 655, in <module>
537
+ main()
538
+ File "./run_clm_flax.py", line 620, in main
539
+ batch = next(eval_loader)
540
+ File "./run_clm_flax.py", line 193, in data_loader
541
+ for idx in batch_idx:
542
+ File "/home/cahya/miniconda3/envs/jax/lib/python3.8/site-packages/jax/interpreters/xla.py", line 1264, in __iter__
543
+ return self._value.__iter__()
544
+ KeyboardInterrupt
wandb/run-20210709_141445-2k8cnty2/files/wandb-summary.json CHANGED
@@ -1 +1 @@
1
- {"global_step": 90, "_timestamp": 1625840867.513841, "eval_loss": 7.724389553070068, "eval_perplexity": 2262.870849609375, "_step": 8}
 
1
+ {"global_step": 100, "_timestamp": 1625840946.414606, "eval_loss": 7.69423770904541, "eval_perplexity": 2195.659423828125, "_step": 9}
wandb/run-20210709_141445-2k8cnty2/logs/debug-internal.log CHANGED
@@ -330,3 +330,139 @@
330
  2021-07-09 14:29:24,657 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
331
  2021-07-09 14:29:28,577 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
332
  2021-07-09 14:29:28,578 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
330
  2021-07-09 14:29:24,657 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
331
  2021-07-09 14:29:28,577 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
332
  2021-07-09 14:29:28,578 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
333
+ 2021-07-09 14:29:43,713 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
334
+ 2021-07-09 14:29:43,713 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
335
+ 2021-07-09 14:29:47,814 DEBUG SenderThread:246776 [sender.py:send():179] send: stats
336
+ 2021-07-09 14:29:58,843 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
337
+ 2021-07-09 14:29:58,844 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
338
+ 2021-07-09 14:30:13,979 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
339
+ 2021-07-09 14:30:13,980 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
340
+ 2021-07-09 14:30:17,889 DEBUG SenderThread:246776 [sender.py:send():179] send: stats
341
+ 2021-07-09 14:30:24,683 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
342
+ 2021-07-09 14:30:26,684 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
343
+ 2021-07-09 14:30:28,685 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
344
+ 2021-07-09 14:30:29,111 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: stop_status
345
+ 2021-07-09 14:30:29,111 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: stop_status
346
+ 2021-07-09 14:30:30,097 WARNING MainThread:246776 [internal.py:wandb_internal():147] Internal process interrupt: 1
347
+ 2021-07-09 14:30:30,685 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
348
+ 2021-07-09 14:30:34,687 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
349
+ 2021-07-09 14:30:36,622 DEBUG SenderThread:246776 [sender.py:send():179] send: telemetry
350
+ 2021-07-09 14:30:36,622 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
351
+ 2021-07-09 14:30:36,622 DEBUG SenderThread:246776 [sender.py:send():179] send: exit
352
+ 2021-07-09 14:30:36,622 INFO SenderThread:246776 [sender.py:send_exit():287] handling exit code: 255
353
+ 2021-07-09 14:30:36,623 INFO SenderThread:246776 [sender.py:send_exit():295] send defer
354
+ 2021-07-09 14:30:36,623 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
355
+ 2021-07-09 14:30:36,624 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
356
+ 2021-07-09 14:30:36,624 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 0
357
+ 2021-07-09 14:30:36,624 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
358
+ 2021-07-09 14:30:36,624 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 0
359
+ 2021-07-09 14:30:36,624 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 1
360
+ 2021-07-09 14:30:36,624 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
361
+ 2021-07-09 14:30:36,624 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 1
362
+ 2021-07-09 14:30:36,631 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
363
+ 2021-07-09 14:30:36,631 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 1
364
+ 2021-07-09 14:30:36,631 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 2
365
+ 2021-07-09 14:30:36,631 DEBUG SenderThread:246776 [sender.py:send():179] send: stats
366
+ 2021-07-09 14:30:36,632 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
367
+ 2021-07-09 14:30:36,632 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 2
368
+ 2021-07-09 14:30:36,688 INFO Thread-8 :246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
369
+ 2021-07-09 14:30:42,961 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
370
+ 2021-07-09 14:30:42,961 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
371
+ 2021-07-09 14:30:42,961 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 2
372
+ 2021-07-09 14:30:42,961 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
373
+ 2021-07-09 14:30:42,961 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 3
374
+ 2021-07-09 14:30:42,962 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
375
+ 2021-07-09 14:30:42,962 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
376
+ 2021-07-09 14:30:42,963 DEBUG SenderThread:246776 [sender.py:send():179] send: history
377
+ 2021-07-09 14:30:42,963 DEBUG SenderThread:246776 [sender.py:send():179] send: summary
378
+ 2021-07-09 14:30:42,963 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
379
+ 2021-07-09 14:30:42,964 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 3
380
+ 2021-07-09 14:30:42,964 INFO SenderThread:246776 [sender.py:_save_file():841] saving file wandb-summary.json with policy end
381
+ 2021-07-09 14:30:42,964 DEBUG SenderThread:246776 [sender.py:send():179] send: summary
382
+ 2021-07-09 14:30:42,965 INFO SenderThread:246776 [sender.py:_save_file():841] saving file wandb-summary.json with policy end
383
+ 2021-07-09 14:30:42,965 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
384
+ 2021-07-09 14:30:42,965 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 3
385
+ 2021-07-09 14:30:42,965 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 4
386
+ 2021-07-09 14:30:42,965 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
387
+ 2021-07-09 14:30:42,965 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 4
388
+ 2021-07-09 14:30:42,965 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
389
+ 2021-07-09 14:30:42,966 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 4
390
+ 2021-07-09 14:30:43,065 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
391
+ 2021-07-09 14:30:43,170 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 5
392
+ 2021-07-09 14:30:43,170 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
393
+ 2021-07-09 14:30:43,171 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
394
+ 2021-07-09 14:30:43,171 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 5
395
+ 2021-07-09 14:30:43,171 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
396
+ 2021-07-09 14:30:43,171 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 5
397
+ 2021-07-09 14:30:43,171 INFO SenderThread:246776 [dir_watcher.py:finish():282] shutting down directory watcher
398
+ 2021-07-09 14:30:43,272 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
399
+ 2021-07-09 14:30:43,690 INFO SenderThread:246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/config.yaml
400
+ 2021-07-09 14:30:43,691 INFO SenderThread:246776 [dir_watcher.py:_on_file_modified():229] file/dir modified: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/wandb-summary.json
401
+ 2021-07-09 14:30:43,691 INFO SenderThread:246776 [dir_watcher.py:finish():312] scan: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files
402
+ 2021-07-09 14:30:43,691 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/conda-environment.yaml conda-environment.yaml
403
+ 2021-07-09 14:30:43,691 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/requirements.txt requirements.txt
404
+ 2021-07-09 14:30:43,691 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log output.log
405
+ 2021-07-09 14:30:43,692 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/wandb-metadata.json wandb-metadata.json
406
+ 2021-07-09 14:30:43,692 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/config.yaml config.yaml
407
+ 2021-07-09 14:30:43,695 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/events.out.tfevents.1625840127.t1v-n-528d9406-w-0.245719.3.v2 events.out.tfevents.1625840127.t1v-n-528d9406-w-0.245719.3.v2
408
+ 2021-07-09 14:30:43,695 INFO SenderThread:246776 [dir_watcher.py:finish():318] scan save: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/wandb-summary.json wandb-summary.json
409
+ 2021-07-09 14:30:43,695 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 6
410
+ 2021-07-09 14:30:43,695 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
411
+ 2021-07-09 14:30:43,696 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
412
+ 2021-07-09 14:30:43,705 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 6
413
+ 2021-07-09 14:30:43,705 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
414
+ 2021-07-09 14:30:43,705 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 6
415
+ 2021-07-09 14:30:43,705 INFO SenderThread:246776 [file_pusher.py:finish():177] shutting down file pusher
416
+ 2021-07-09 14:30:43,798 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
417
+ 2021-07-09 14:30:43,798 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
418
+ 2021-07-09 14:30:43,900 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
419
+ 2021-07-09 14:30:43,900 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
420
+ 2021-07-09 14:30:44,002 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
421
+ 2021-07-09 14:30:44,002 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
422
+ 2021-07-09 14:30:44,104 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
423
+ 2021-07-09 14:30:44,104 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
424
+ 2021-07-09 14:30:44,144 INFO Thread-24 :246776 [upload_job.py:push():137] Uploaded file /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/config.yaml
425
+ 2021-07-09 14:30:44,145 INFO Thread-22 :246776 [upload_job.py:push():137] Uploaded file /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/requirements.txt
426
+ 2021-07-09 14:30:44,154 INFO Thread-21 :246776 [upload_job.py:push():137] Uploaded file /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/conda-environment.yaml
427
+ 2021-07-09 14:30:44,183 INFO Thread-26 :246776 [upload_job.py:push():137] Uploaded file /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/wandb-summary.json
428
+ 2021-07-09 14:30:44,206 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
429
+ 2021-07-09 14:30:44,206 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
430
+ 2021-07-09 14:30:44,232 INFO Thread-25 :246776 [upload_job.py:push():137] Uploaded file /tmp/tmp4f0a6i2mwandb/i1mxdnz1-events.out.tfevents.1625840127.t1v-n-528d9406-w-0.245719.3.v2
431
+ 2021-07-09 14:30:44,307 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
432
+ 2021-07-09 14:30:44,308 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
433
+ 2021-07-09 14:30:44,359 INFO Thread-23 :246776 [upload_job.py:push():137] Uploaded file /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/files/output.log
434
+ 2021-07-09 14:30:44,409 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
435
+ 2021-07-09 14:30:44,409 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
436
+ 2021-07-09 14:30:44,511 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
437
+ 2021-07-09 14:30:44,511 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
438
+ 2021-07-09 14:30:44,559 INFO Thread-7 :246776 [sender.py:transition_state():308] send defer: 7
439
+ 2021-07-09 14:30:44,560 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
440
+ 2021-07-09 14:30:44,560 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 7
441
+ 2021-07-09 14:30:44,560 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
442
+ 2021-07-09 14:30:44,560 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 7
443
+ 2021-07-09 14:30:44,612 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
444
+ 2021-07-09 14:30:44,831 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 8
445
+ 2021-07-09 14:30:44,831 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
446
+ 2021-07-09 14:30:44,832 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
447
+ 2021-07-09 14:30:44,832 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 8
448
+ 2021-07-09 14:30:44,832 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
449
+ 2021-07-09 14:30:44,832 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 8
450
+ 2021-07-09 14:30:44,832 INFO SenderThread:246776 [sender.py:transition_state():308] send defer: 9
451
+ 2021-07-09 14:30:44,833 DEBUG SenderThread:246776 [sender.py:send():179] send: final
452
+ 2021-07-09 14:30:44,833 DEBUG SenderThread:246776 [sender.py:send():179] send: footer
453
+ 2021-07-09 14:30:44,833 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: defer
454
+ 2021-07-09 14:30:44,833 INFO HandlerThread:246776 [handler.py:handle_request_defer():141] handle defer: 9
455
+ 2021-07-09 14:30:44,833 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: defer
456
+ 2021-07-09 14:30:44,833 INFO SenderThread:246776 [sender.py:send_request_defer():304] handle sender defer: 9
457
+ 2021-07-09 14:30:44,933 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: poll_exit
458
+ 2021-07-09 14:30:44,933 DEBUG SenderThread:246776 [sender.py:send_request():193] send_request: poll_exit
459
+ 2021-07-09 14:30:44,933 INFO SenderThread:246776 [file_pusher.py:join():182] waiting for file pusher
460
+ 2021-07-09 14:30:44,935 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: get_summary
461
+ 2021-07-09 14:30:44,936 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: sampled_history
462
+ 2021-07-09 14:30:44,937 DEBUG HandlerThread:246776 [handler.py:handle_request():124] handle_request: shutdown
463
+ 2021-07-09 14:30:44,937 INFO HandlerThread:246776 [handler.py:finish():638] shutting down handler
464
+ 2021-07-09 14:30:45,833 INFO WriterThread:246776 [datastore.py:close():288] close: /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_141445-2k8cnty2/run-2k8cnty2.wandb
465
+ 2021-07-09 14:30:45,934 INFO SenderThread:246776 [sender.py:finish():945] shutting down sender
466
+ 2021-07-09 14:30:45,934 INFO SenderThread:246776 [file_pusher.py:finish():177] shutting down file pusher
467
+ 2021-07-09 14:30:45,934 INFO SenderThread:246776 [file_pusher.py:join():182] waiting for file pusher
468
+ 2021-07-09 14:30:45,936 INFO MainThread:246776 [internal.py:handle_exit():78] Internal process exited
wandb/run-20210709_141445-2k8cnty2/logs/debug.log CHANGED
@@ -27,3 +27,138 @@ config: {}
27
  2021-07-09 14:14:49,958 INFO MainThread:245719 [wandb_config.py:__setitem__():141] config set test_log = 12345 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7fab4d59abb0>>
28
  2021-07-09 14:14:49,958 INFO MainThread:245719 [wandb_run.py:_config_callback():872] config_cb test_log 12345 None
29
  2021-07-09 14:15:27,424 INFO MainThread:245719 [wandb_run.py:_tensorboard_callback():943] tensorboard callback: /home/cahya/Work/flax-community/gpt2-medium-indonesian, None
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
27
  2021-07-09 14:14:49,958 INFO MainThread:245719 [wandb_config.py:__setitem__():141] config set test_log = 12345 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7fab4d59abb0>>
28
  2021-07-09 14:14:49,958 INFO MainThread:245719 [wandb_run.py:_config_callback():872] config_cb test_log 12345 None
29
  2021-07-09 14:15:27,424 INFO MainThread:245719 [wandb_run.py:_tensorboard_callback():943] tensorboard callback: /home/cahya/Work/flax-community/gpt2-medium-indonesian, None
30
+ 2021-07-09 14:30:34,276 INFO MainThread:245719 [wandb_run.py:_atexit_cleanup():1593] got exitcode: 255
31
+ 2021-07-09 14:30:34,276 INFO MainThread:245719 [wandb_run.py:_restore():1565] restore
32
+ 2021-07-09 14:30:36,624 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
33
+ wandb_count: 1
34
+ other_count: 1
35
+ }
36
+ pusher_stats {
37
+ uploaded_bytes: 3022
38
+ total_bytes: 3022
39
+ }
40
+
41
+ 2021-07-09 14:30:41,726 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: None
42
+ 2021-07-09 14:30:42,963 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
43
+ wandb_count: 1
44
+ other_count: 1
45
+ }
46
+ pusher_stats {
47
+ uploaded_bytes: 3022
48
+ total_bytes: 3022
49
+ }
50
+
51
+ 2021-07-09 14:30:43,171 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
52
+ wandb_count: 1
53
+ other_count: 1
54
+ }
55
+ pusher_stats {
56
+ uploaded_bytes: 3022
57
+ total_bytes: 3022
58
+ }
59
+
60
+ 2021-07-09 14:30:43,697 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
61
+ wandb_count: 5
62
+ other_count: 1
63
+ }
64
+ pusher_stats {
65
+ uploaded_bytes: 3022
66
+ total_bytes: 100895
67
+ }
68
+
69
+ 2021-07-09 14:30:43,799 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
70
+ wandb_count: 6
71
+ other_count: 1
72
+ }
73
+ pusher_stats {
74
+ uploaded_bytes: 1722
75
+ total_bytes: 101169
76
+ }
77
+
78
+ 2021-07-09 14:30:43,901 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
79
+ wandb_count: 6
80
+ other_count: 1
81
+ }
82
+ pusher_stats {
83
+ uploaded_bytes: 101169
84
+ total_bytes: 101169
85
+ }
86
+
87
+ 2021-07-09 14:30:44,003 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
88
+ wandb_count: 6
89
+ other_count: 1
90
+ }
91
+ pusher_stats {
92
+ uploaded_bytes: 101169
93
+ total_bytes: 101169
94
+ }
95
+
96
+ 2021-07-09 14:30:44,104 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
97
+ wandb_count: 6
98
+ other_count: 1
99
+ }
100
+ pusher_stats {
101
+ uploaded_bytes: 101169
102
+ total_bytes: 101169
103
+ }
104
+
105
+ 2021-07-09 14:30:44,206 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
106
+ wandb_count: 6
107
+ other_count: 1
108
+ }
109
+ pusher_stats {
110
+ uploaded_bytes: 101169
111
+ total_bytes: 101169
112
+ }
113
+
114
+ 2021-07-09 14:30:44,308 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
115
+ wandb_count: 6
116
+ other_count: 1
117
+ }
118
+ pusher_stats {
119
+ uploaded_bytes: 101169
120
+ total_bytes: 101169
121
+ }
122
+
123
+ 2021-07-09 14:30:44,410 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
124
+ wandb_count: 6
125
+ other_count: 1
126
+ }
127
+ pusher_stats {
128
+ uploaded_bytes: 101169
129
+ total_bytes: 101169
130
+ }
131
+
132
+ 2021-07-09 14:30:44,511 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
133
+ wandb_count: 6
134
+ other_count: 1
135
+ }
136
+ pusher_stats {
137
+ uploaded_bytes: 101169
138
+ total_bytes: 101169
139
+ }
140
+
141
+ 2021-07-09 14:30:44,832 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: file_counts {
142
+ wandb_count: 6
143
+ other_count: 1
144
+ }
145
+ pusher_stats {
146
+ uploaded_bytes: 101169
147
+ total_bytes: 101169
148
+ }
149
+
150
+ 2021-07-09 14:30:44,934 INFO MainThread:245719 [wandb_run.py:_wait_for_finish():1715] got exit ret: done: true
151
+ exit_result {
152
+ }
153
+ file_counts {
154
+ wandb_count: 6
155
+ other_count: 1
156
+ }
157
+ pusher_stats {
158
+ uploaded_bytes: 101169
159
+ total_bytes: 101169
160
+ }
161
+
162
+ 2021-07-09 14:30:46,219 INFO MainThread:245719 [wandb_run.py:_show_summary():1870] rendering summary
163
+ 2021-07-09 14:30:46,220 INFO MainThread:245719 [wandb_run.py:_show_history():1908] rendering history
164
+ 2021-07-09 14:30:46,220 INFO MainThread:245719 [wandb_run.py:_show_files():1937] logging synced files
wandb/run-20210709_141445-2k8cnty2/run-2k8cnty2.wandb CHANGED
Binary files a/wandb/run-20210709_141445-2k8cnty2/run-2k8cnty2.wandb and b/wandb/run-20210709_141445-2k8cnty2/run-2k8cnty2.wandb differ
 
wandb/run-20210709_144100-2k1kyrq2/files/conda-environment.yaml ADDED
@@ -0,0 +1,187 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: jax
2
+ channels:
3
+ - pytorch
4
+ - conda-forge
5
+ - defaults
6
+ dependencies:
7
+ - _libgcc_mutex=0.1=main
8
+ - _openmp_mutex=4.5=1_gnu
9
+ - anyio=3.2.1=py38h578d9bd_0
10
+ - argon2-cffi=20.1.0=py38h497a2fe_2
11
+ - async_generator=1.10=py_0
12
+ - attrs=21.2.0=pyhd8ed1ab_0
13
+ - babel=2.9.1=pyh44b312d_0
14
+ - backcall=0.2.0=pyh9f0ad1d_0
15
+ - backports=1.0=py_2
16
+ - backports.functools_lru_cache=1.6.4=pyhd8ed1ab_0
17
+ - blas=1.0=mkl
18
+ - bleach=3.3.0=pyh44b312d_0
19
+ - brotlipy=0.7.0=py38h497a2fe_1001
20
+ - ca-certificates=2021.5.30=ha878542_0
21
+ - certifi=2021.5.30=py38h578d9bd_0
22
+ - cffi=1.14.5=py38ha65f79e_0
23
+ - chardet=4.0.0=py38h578d9bd_1
24
+ - cryptography=3.4.7=py38ha5dfef3_0
25
+ - cudatoolkit=10.2.89=hfd86e86_1
26
+ - debugpy=1.3.0=py38h709712a_0
27
+ - decorator=5.0.9=pyhd8ed1ab_0
28
+ - defusedxml=0.7.1=pyhd8ed1ab_0
29
+ - entrypoints=0.3=pyhd8ed1ab_1003
30
+ - idna=2.10=pyh9f0ad1d_0
31
+ - importlib-metadata=4.6.1=py38h578d9bd_0
32
+ - intel-openmp=2021.2.0=h06a4308_610
33
+ - ipykernel=6.0.1=py38hd0cf306_0
34
+ - ipython=7.25.0=py38hd0cf306_1
35
+ - ipython_genutils=0.2.0=py_1
36
+ - jedi=0.18.0=py38h578d9bd_2
37
+ - jinja2=3.0.1=pyhd8ed1ab_0
38
+ - json5=0.9.5=pyh9f0ad1d_0
39
+ - jsonschema=3.2.0=pyhd8ed1ab_3
40
+ - jupyter_client=6.1.12=pyhd8ed1ab_0
41
+ - jupyter_core=4.7.1=py38h578d9bd_0
42
+ - jupyter_server=1.9.0=pyhd8ed1ab_0
43
+ - jupyterlab=3.0.16=pyhd8ed1ab_0
44
+ - jupyterlab_pygments=0.1.2=pyh9f0ad1d_0
45
+ - jupyterlab_server=2.6.0=pyhd8ed1ab_0
46
+ - ld_impl_linux-64=2.35.1=h7274673_9
47
+ - libffi=3.3=he6710b0_2
48
+ - libgcc-ng=9.3.0=h5101ec6_17
49
+ - libgomp=9.3.0=h5101ec6_17
50
+ - libsodium=1.0.18=h36c2ea0_1
51
+ - libstdcxx-ng=9.3.0=hd4cf53a_17
52
+ - libuv=1.40.0=h7b6447c_0
53
+ - markupsafe=2.0.1=py38h497a2fe_0
54
+ - matplotlib-inline=0.1.2=pyhd8ed1ab_2
55
+ - mistune=0.8.4=py38h497a2fe_1004
56
+ - mkl=2021.2.0=h06a4308_296
57
+ - nbclassic=0.3.1=pyhd8ed1ab_1
58
+ - nbclient=0.5.3=pyhd8ed1ab_0
59
+ - nbconvert=6.1.0=py38h578d9bd_0
60
+ - nbformat=5.1.3=pyhd8ed1ab_0
61
+ - ncurses=6.2=he6710b0_1
62
+ - nest-asyncio=1.5.1=pyhd8ed1ab_0
63
+ - ninja=1.10.2=hff7bd54_1
64
+ - notebook=6.4.0=pyha770c72_0
65
+ - openssl=1.1.1k=h7f98852_0
66
+ - pandoc=2.14.0.3=h7f98852_0
67
+ - pandocfilters=1.4.2=py_1
68
+ - parso=0.8.2=pyhd8ed1ab_0
69
+ - pexpect=4.8.0=pyh9f0ad1d_2
70
+ - pickleshare=0.7.5=py_1003
71
+ - pip=21.1.3=py38h06a4308_0
72
+ - prometheus_client=0.11.0=pyhd8ed1ab_0
73
+ - prompt-toolkit=3.0.19=pyha770c72_0
74
+ - ptyprocess=0.7.0=pyhd3deb0d_0
75
+ - pycparser=2.20=pyh9f0ad1d_2
76
+ - pygments=2.9.0=pyhd8ed1ab_0
77
+ - pyopenssl=20.0.1=pyhd8ed1ab_0
78
+ - pyparsing=2.4.7=pyh9f0ad1d_0
79
+ - pyrsistent=0.17.3=py38h497a2fe_2
80
+ - pysocks=1.7.1=py38h578d9bd_3
81
+ - python=3.8.10=h12debd9_8
82
+ - python-dateutil=2.8.1=py_0
83
+ - python_abi=3.8=2_cp38
84
+ - pytorch=1.9.0=py3.8_cuda10.2_cudnn7.6.5_0
85
+ - pytz=2021.1=pyhd8ed1ab_0
86
+ - pyzmq=22.1.0=py38h2035c66_0
87
+ - readline=8.1=h27cfd23_0
88
+ - requests=2.25.1=pyhd3deb0d_0
89
+ - requests-unixsocket=0.2.0=py_0
90
+ - send2trash=1.7.1=pyhd8ed1ab_0
91
+ - setuptools=52.0.0=py38h06a4308_0
92
+ - sniffio=1.2.0=py38h578d9bd_1
93
+ - sqlite=3.36.0=hc218d9a_0
94
+ - terminado=0.10.1=py38h578d9bd_0
95
+ - testpath=0.5.0=pyhd8ed1ab_0
96
+ - tk=8.6.10=hbc83047_0
97
+ - tornado=6.1=py38h497a2fe_1
98
+ - traitlets=5.0.5=py_0
99
+ - typing_extensions=3.10.0.0=pyha770c72_0
100
+ - urllib3=1.26.6=pyhd8ed1ab_0
101
+ - wcwidth=0.2.5=pyh9f0ad1d_2
102
+ - webencodings=0.5.1=py_1
103
+ - websocket-client=0.57.0=py38h578d9bd_4
104
+ - wheel=0.36.2=pyhd3eb1b0_0
105
+ - xz=5.2.5=h7b6447c_0
106
+ - zeromq=4.3.4=h9c3ff4c_0
107
+ - zipp=3.5.0=pyhd8ed1ab_0
108
+ - zlib=1.2.11=h7b6447c_3
109
+ - pip:
110
+ - absl-py==0.13.0
111
+ - aiohttp==3.7.4.post0
112
+ - astunparse==1.6.3
113
+ - async-timeout==3.0.1
114
+ - cachetools==4.2.2
115
+ - chex==0.0.8
116
+ - click==8.0.1
117
+ - configparser==5.0.2
118
+ - cycler==0.10.0
119
+ - dill==0.3.4
120
+ - dm-tree==0.1.6
121
+ - docker-pycreds==0.4.0
122
+ - filelock==3.0.12
123
+ - flatbuffers==1.12
124
+ - flax==0.3.4
125
+ - fsspec==2021.6.1
126
+ - gast==0.4.0
127
+ - gitdb==4.0.7
128
+ - gitpython==3.1.18
129
+ - google-auth==1.32.1
130
+ - google-auth-oauthlib==0.4.4
131
+ - google-pasta==0.2.0
132
+ - grpcio==1.34.1
133
+ - h5py==3.1.0
134
+ - huggingface-hub==0.0.12
135
+ - jax==0.2.16
136
+ - jaxlib==0.1.68
137
+ - joblib==1.0.1
138
+ - keras-nightly==2.5.0.dev2021032900
139
+ - keras-preprocessing==1.1.2
140
+ - kiwisolver==1.3.1
141
+ - libtpu-nightly==0.1.dev20210615
142
+ - markdown==3.3.4
143
+ - matplotlib==3.4.2
144
+ - msgpack==1.0.2
145
+ - multidict==5.1.0
146
+ - multiprocess==0.70.12.2
147
+ - numpy==1.19.5
148
+ - oauthlib==3.1.1
149
+ - opt-einsum==3.3.0
150
+ - optax==0.0.9
151
+ - packaging==20.9
152
+ - pandas==1.2.5
153
+ - pathtools==0.1.2
154
+ - pillow==8.3.0
155
+ - promise==2.3
156
+ - protobuf==3.17.3
157
+ - psutil==5.8.0
158
+ - pyarrow==4.0.1
159
+ - pyasn1==0.4.8
160
+ - pyasn1-modules==0.2.8
161
+ - pyyaml==5.4.1
162
+ - regex==2021.7.1
163
+ - requests-oauthlib==1.3.0
164
+ - rsa==4.7.2
165
+ - sacremoses==0.0.45
166
+ - scipy==1.7.0
167
+ - sentry-sdk==1.1.0
168
+ - shortuuid==1.0.1
169
+ - six==1.15.0
170
+ - smmap==4.0.0
171
+ - subprocess32==3.5.4
172
+ - tensorboard==2.5.0
173
+ - tensorboard-data-server==0.6.1
174
+ - tensorboard-plugin-wit==1.8.0
175
+ - tensorflow==2.5.0
176
+ - tensorflow-estimator==2.5.0
177
+ - termcolor==1.1.0
178
+ - tokenizers==0.10.3
179
+ - toolz==0.11.1
180
+ - tqdm==4.61.1
181
+ - typing-extensions==3.7.4.3
182
+ - wandb==0.10.33
183
+ - werkzeug==2.0.1
184
+ - wrapt==1.12.1
185
+ - xxhash==2.0.2
186
+ - yarl==1.6.3
187
+ prefix: /home/cahya/miniconda3/envs/jax
wandb/run-20210709_144100-2k1kyrq2/files/config.yaml ADDED
@@ -0,0 +1,305 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ __cached__setup_devices:
4
+ desc: null
5
+ value: cpu
6
+ _n_gpu:
7
+ desc: null
8
+ value: 0
9
+ _wandb:
10
+ desc: null
11
+ value:
12
+ cli_version: 0.10.33
13
+ framework: huggingface
14
+ huggingface_version: 4.9.0.dev0
15
+ is_jupyter_run: false
16
+ is_kaggle_kernel: false
17
+ python_version: 3.8.10
18
+ t:
19
+ 1:
20
+ - 1
21
+ - 3
22
+ - 11
23
+ 4: 3.8.10
24
+ 5: 0.10.33
25
+ 6: 4.9.0.dev0
26
+ 8:
27
+ - 5
28
+ adafactor:
29
+ desc: null
30
+ value: false
31
+ adam_beta1:
32
+ desc: null
33
+ value: 0.9
34
+ adam_beta2:
35
+ desc: null
36
+ value: 0.98
37
+ adam_epsilon:
38
+ desc: null
39
+ value: 1.0e-08
40
+ block_size:
41
+ desc: null
42
+ value: 512
43
+ cache_dir:
44
+ desc: null
45
+ value: null
46
+ config_name:
47
+ desc: null
48
+ value: /home/cahya/Work/flax-community/gpt2-medium-indonesian
49
+ dataloader_drop_last:
50
+ desc: null
51
+ value: false
52
+ dataloader_num_workers:
53
+ desc: null
54
+ value: 64
55
+ dataloader_pin_memory:
56
+ desc: null
57
+ value: true
58
+ dataset_config_name:
59
+ desc: null
60
+ value: unshuffled_deduplicated_id
61
+ dataset_name:
62
+ desc: null
63
+ value: oscar
64
+ ddp_find_unused_parameters:
65
+ desc: null
66
+ value: null
67
+ debug:
68
+ desc: null
69
+ value: []
70
+ deepspeed:
71
+ desc: null
72
+ value: null
73
+ disable_tqdm:
74
+ desc: null
75
+ value: false
76
+ do_eval:
77
+ desc: null
78
+ value: true
79
+ do_predict:
80
+ desc: null
81
+ value: false
82
+ do_train:
83
+ desc: null
84
+ value: true
85
+ dtype:
86
+ desc: null
87
+ value: float32
88
+ eval_accumulation_steps:
89
+ desc: null
90
+ value: null
91
+ eval_steps:
92
+ desc: null
93
+ value: 5000
94
+ evaluation_strategy:
95
+ desc: null
96
+ value: IntervalStrategy.NO
97
+ fp16:
98
+ desc: null
99
+ value: false
100
+ fp16_backend:
101
+ desc: null
102
+ value: auto
103
+ fp16_full_eval:
104
+ desc: null
105
+ value: false
106
+ fp16_opt_level:
107
+ desc: null
108
+ value: O1
109
+ gradient_accumulation_steps:
110
+ desc: null
111
+ value: 1
112
+ greater_is_better:
113
+ desc: null
114
+ value: null
115
+ group_by_length:
116
+ desc: null
117
+ value: false
118
+ ignore_data_skip:
119
+ desc: null
120
+ value: false
121
+ label_names:
122
+ desc: null
123
+ value: null
124
+ label_smoothing_factor:
125
+ desc: null
126
+ value: 0.0
127
+ learning_rate:
128
+ desc: null
129
+ value: 0.0024
130
+ length_column_name:
131
+ desc: null
132
+ value: length
133
+ load_best_model_at_end:
134
+ desc: null
135
+ value: false
136
+ local_rank:
137
+ desc: null
138
+ value: -1
139
+ log_level:
140
+ desc: null
141
+ value: -1
142
+ log_level_replica:
143
+ desc: null
144
+ value: -1
145
+ log_on_each_node:
146
+ desc: null
147
+ value: true
148
+ logging_dir:
149
+ desc: null
150
+ value: /home/cahya/Work/flax-community/gpt2-medium-indonesian/runs/Jul09_14-41-04_t1v-n-528d9406-w-0
151
+ logging_first_step:
152
+ desc: null
153
+ value: false
154
+ logging_steps:
155
+ desc: null
156
+ value: 5000
157
+ logging_strategy:
158
+ desc: null
159
+ value: IntervalStrategy.STEPS
160
+ lr_scheduler_type:
161
+ desc: null
162
+ value: SchedulerType.LINEAR
163
+ max_eval_samples:
164
+ desc: null
165
+ value: null
166
+ max_grad_norm:
167
+ desc: null
168
+ value: 1.0
169
+ max_steps:
170
+ desc: null
171
+ value: -1
172
+ max_train_samples:
173
+ desc: null
174
+ value: null
175
+ metric_for_best_model:
176
+ desc: null
177
+ value: null
178
+ model_name_or_path:
179
+ desc: null
180
+ value: null
181
+ model_type:
182
+ desc: null
183
+ value: gpt2
184
+ mp_parameters:
185
+ desc: null
186
+ value: ''
187
+ no_cuda:
188
+ desc: null
189
+ value: false
190
+ num_train_epochs:
191
+ desc: null
192
+ value: 20.0
193
+ output_dir:
194
+ desc: null
195
+ value: /home/cahya/Work/flax-community/gpt2-medium-indonesian
196
+ overwrite_cache:
197
+ desc: null
198
+ value: false
199
+ overwrite_output_dir:
200
+ desc: null
201
+ value: true
202
+ past_index:
203
+ desc: null
204
+ value: -1
205
+ per_device_eval_batch_size:
206
+ desc: null
207
+ value: 24
208
+ per_device_train_batch_size:
209
+ desc: null
210
+ value: 24
211
+ per_gpu_eval_batch_size:
212
+ desc: null
213
+ value: null
214
+ per_gpu_train_batch_size:
215
+ desc: null
216
+ value: null
217
+ prediction_loss_only:
218
+ desc: null
219
+ value: false
220
+ preprocessing_num_workers:
221
+ desc: null
222
+ value: 64
223
+ push_to_hub:
224
+ desc: null
225
+ value: true
226
+ push_to_hub_model_id:
227
+ desc: null
228
+ value: gpt2-medium-indonesian
229
+ push_to_hub_organization:
230
+ desc: null
231
+ value: null
232
+ push_to_hub_token:
233
+ desc: null
234
+ value: null
235
+ remove_unused_columns:
236
+ desc: null
237
+ value: true
238
+ report_to:
239
+ desc: null
240
+ value:
241
+ - tensorboard
242
+ - wandb
243
+ resume_from_checkpoint:
244
+ desc: null
245
+ value: null
246
+ run_name:
247
+ desc: null
248
+ value: /home/cahya/Work/flax-community/gpt2-medium-indonesian
249
+ save_on_each_node:
250
+ desc: null
251
+ value: false
252
+ save_steps:
253
+ desc: null
254
+ value: 5000
255
+ save_strategy:
256
+ desc: null
257
+ value: IntervalStrategy.STEPS
258
+ save_total_limit:
259
+ desc: null
260
+ value: null
261
+ seed:
262
+ desc: null
263
+ value: 42
264
+ sharded_ddp:
265
+ desc: null
266
+ value: []
267
+ skip_memory_metrics:
268
+ desc: null
269
+ value: true
270
+ test_log:
271
+ desc: null
272
+ value: 12345
273
+ tokenizer_name:
274
+ desc: null
275
+ value: /home/cahya/Work/flax-community/gpt2-medium-indonesian
276
+ tpu_metrics_debug:
277
+ desc: null
278
+ value: false
279
+ tpu_num_cores:
280
+ desc: null
281
+ value: null
282
+ train_file:
283
+ desc: null
284
+ value: null
285
+ use_fast_tokenizer:
286
+ desc: null
287
+ value: true
288
+ use_legacy_prediction_loop:
289
+ desc: null
290
+ value: false
291
+ validation_file:
292
+ desc: null
293
+ value: null
294
+ validation_split_percentage:
295
+ desc: null
296
+ value: 2
297
+ warmup_ratio:
298
+ desc: null
299
+ value: 0.0
300
+ warmup_steps:
301
+ desc: null
302
+ value: 1000
303
+ weight_decay:
304
+ desc: null
305
+ value: 0.01
wandb/run-20210709_144100-2k1kyrq2/files/events.out.tfevents.1625843003.t1v-n-528d9406-w-0.250031.3.v2 ADDED
@@ -0,0 +1 @@
 
 
1
+ /home/cahya/Work/flax-community/gpt2-medium-indonesian/events.out.tfevents.1625843003.t1v-n-528d9406-w-0.250031.3.v2
wandb/run-20210709_144100-2k1kyrq2/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20210709_144100-2k1kyrq2/files/requirements.txt ADDED
@@ -0,0 +1,153 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ absl-py==0.13.0
2
+ aiohttp==3.7.4.post0
3
+ anyio==3.2.1
4
+ argon2-cffi==20.1.0
5
+ astunparse==1.6.3
6
+ async-generator==1.10
7
+ async-timeout==3.0.1
8
+ attrs==21.2.0
9
+ babel==2.9.1
10
+ backcall==0.2.0
11
+ backports.functools-lru-cache==1.6.4
12
+ bleach==3.3.0
13
+ brotlipy==0.7.0
14
+ cachetools==4.2.2
15
+ certifi==2021.5.30
16
+ cffi==1.14.5
17
+ chardet==4.0.0
18
+ chex==0.0.8
19
+ click==8.0.1
20
+ configparser==5.0.2
21
+ cryptography==3.4.7
22
+ cycler==0.10.0
23
+ datasets==1.8.1.dev0
24
+ debugpy==1.3.0
25
+ decorator==5.0.9
26
+ defusedxml==0.7.1
27
+ dill==0.3.4
28
+ dm-tree==0.1.6
29
+ docker-pycreds==0.4.0
30
+ entrypoints==0.3
31
+ filelock==3.0.12
32
+ flatbuffers==1.12
33
+ flax==0.3.4
34
+ fsspec==2021.6.1
35
+ gast==0.4.0
36
+ gitdb==4.0.7
37
+ gitpython==3.1.18
38
+ google-auth-oauthlib==0.4.4
39
+ google-auth==1.32.1
40
+ google-pasta==0.2.0
41
+ grpcio==1.34.1
42
+ h5py==3.1.0
43
+ huggingface-hub==0.0.12
44
+ idna==2.10
45
+ importlib-metadata==4.6.1
46
+ ipykernel==6.0.1
47
+ ipython-genutils==0.2.0
48
+ ipython==7.25.0
49
+ jax==0.2.16
50
+ jaxlib==0.1.68
51
+ jedi==0.18.0
52
+ jinja2==3.0.1
53
+ joblib==1.0.1
54
+ json5==0.9.5
55
+ jsonschema==3.2.0
56
+ jupyter-client==6.1.12
57
+ jupyter-core==4.7.1
58
+ jupyter-server==1.9.0
59
+ jupyterlab-pygments==0.1.2
60
+ jupyterlab-server==2.6.0
61
+ jupyterlab==3.0.16
62
+ keras-nightly==2.5.0.dev2021032900
63
+ keras-preprocessing==1.1.2
64
+ kiwisolver==1.3.1
65
+ libtpu-nightly==0.1.dev20210615
66
+ markdown==3.3.4
67
+ markupsafe==2.0.1
68
+ matplotlib-inline==0.1.2
69
+ matplotlib==3.4.2
70
+ mistune==0.8.4
71
+ msgpack==1.0.2
72
+ multidict==5.1.0
73
+ multiprocess==0.70.12.2
74
+ nbclassic==0.3.1
75
+ nbclient==0.5.3
76
+ nbconvert==6.1.0
77
+ nbformat==5.1.3
78
+ nest-asyncio==1.5.1
79
+ notebook==6.4.0
80
+ numpy==1.19.5
81
+ oauthlib==3.1.1
82
+ opt-einsum==3.3.0
83
+ optax==0.0.9
84
+ packaging==21.0
85
+ pandas==1.2.5
86
+ pandocfilters==1.4.2
87
+ parso==0.8.2
88
+ pathtools==0.1.2
89
+ pexpect==4.8.0
90
+ pickleshare==0.7.5
91
+ pillow==8.3.0
92
+ pip==21.1.3
93
+ prometheus-client==0.11.0
94
+ promise==2.3
95
+ prompt-toolkit==3.0.19
96
+ protobuf==3.17.3
97
+ psutil==5.8.0
98
+ ptyprocess==0.7.0
99
+ pyarrow==4.0.1
100
+ pyasn1-modules==0.2.8
101
+ pyasn1==0.4.8
102
+ pycparser==2.20
103
+ pygments==2.9.0
104
+ pyopenssl==20.0.1
105
+ pyparsing==2.4.7
106
+ pyrsistent==0.17.3
107
+ pysocks==1.7.1
108
+ python-dateutil==2.8.1
109
+ pytz==2021.1
110
+ pyyaml==5.4.1
111
+ pyzmq==22.1.0
112
+ regex==2021.7.1
113
+ requests-oauthlib==1.3.0
114
+ requests-unixsocket==0.2.0
115
+ requests==2.25.1
116
+ rsa==4.7.2
117
+ sacremoses==0.0.45
118
+ scipy==1.7.0
119
+ send2trash==1.7.1
120
+ sentry-sdk==1.1.0
121
+ setuptools==52.0.0.post20210125
122
+ shortuuid==1.0.1
123
+ six==1.16.0
124
+ smmap==4.0.0
125
+ sniffio==1.2.0
126
+ subprocess32==3.5.4
127
+ tensorboard-data-server==0.6.1
128
+ tensorboard-plugin-wit==1.8.0
129
+ tensorboard==2.5.0
130
+ tensorflow-estimator==2.5.0
131
+ tensorflow==2.5.0
132
+ termcolor==1.1.0
133
+ terminado==0.10.1
134
+ testpath==0.5.0
135
+ tokenizers==0.10.3
136
+ toolz==0.11.1
137
+ torch==1.9.0
138
+ tornado==6.1
139
+ tqdm==4.61.1
140
+ traitlets==5.0.5
141
+ transformers==4.9.0.dev0
142
+ typing-extensions==3.10.0.0
143
+ urllib3==1.26.6
144
+ wandb==0.10.33
145
+ wcwidth==0.2.5
146
+ webencodings==0.5.1
147
+ websocket-client==0.57.0
148
+ werkzeug==2.0.1
149
+ wheel==0.36.2
150
+ wrapt==1.12.1
151
+ xxhash==2.0.2
152
+ yarl==1.6.3
153
+ zipp==3.5.0
wandb/run-20210709_144100-2k1kyrq2/files/wandb-metadata.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.4.0-1043-gcp-x86_64-with-glibc2.17",
3
+ "python": "3.8.10",
4
+ "heartbeatAt": "2021-07-09T14:41:02.325218",
5
+ "startedAt": "2021-07-09T14:41:00.270917",
6
+ "docker": null,
7
+ "cpu_count": 96,
8
+ "cuda": null,
9
+ "args": [
10
+ "--output_dir=/home/cahya/Work/flax-community/gpt2-medium-indonesian",
11
+ "--model_type=gpt2",
12
+ "--config_name=/home/cahya/Work/flax-community/gpt2-medium-indonesian",
13
+ "--tokenizer_name=/home/cahya/Work/flax-community/gpt2-medium-indonesian",
14
+ "--dataset_name=oscar",
15
+ "--dataset_config_name=unshuffled_deduplicated_id",
16
+ "--do_train",
17
+ "--do_eval",
18
+ "--block_size=512",
19
+ "--per_device_train_batch_size=24",
20
+ "--per_device_eval_batch_size=24",
21
+ "--learning_rate=0.0024",
22
+ "--warmup_steps=1000",
23
+ "--adam_beta1=0.9",
24
+ "--adam_beta2=0.98",
25
+ "--weight_decay=0.01",
26
+ "--overwrite_output_dir",
27
+ "--num_train_epochs=20",
28
+ "--dataloader_num_workers=64",
29
+ "--preprocessing_num_workers=64",
30
+ "--logging_steps=5000",
31
+ "--save_steps=5000",
32
+ "--eval_steps=5000",
33
+ "--validation_split_percentage=2",
34
+ "--push_to_hub"
35
+ ],
36
+ "state": "running",
37
+ "program": "./run_clm_flax.py",
38
+ "codePath": "run_clm_flax.py",
39
+ "git": {
40
+ "remote": "https://huggingface.co/flax-community/gpt2-medium-indonesian",
41
+ "commit": "9b9473462e797993d7ca4cfb92daa71c0bc81e9d"
42
+ },
43
+ "email": "[email protected]",
44
+ "root": "/home/cahya/Work/flax-community/gpt2-medium-indonesian",
45
+ "host": "t1v-n-528d9406-w-0",
46
+ "username": "cahya",
47
+ "executable": "/home/cahya/miniconda3/envs/jax/bin/python"
48
+ }
wandb/run-20210709_144100-2k1kyrq2/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"global_step": 5000, "_timestamp": 1625848638.071834, "train_time": 5622.2197265625, "train_learning_rate": 0.00238410709425807, "_step": 9997, "train_loss": 3.5673484802246094}
wandb/run-20210709_144100-2k1kyrq2/logs/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20210709_144100-2k1kyrq2/logs/debug.log ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_setup.py:_flush():69] Unhandled environment var: WANDB_LOG_MODEL
2
+ 2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_setup.py:_flush():69] setting env: {'project': 'hf-flax-gpt2-indonesian', 'entity': 'wandb'}
3
+ 2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_setup.py:_flush():69] setting login settings: {}
4
+ 2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_init.py:_log_setup():337] Logging user logs to /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_144100-2k1kyrq2/logs/debug.log
5
+ 2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_init.py:_log_setup():338] Logging internal logs to /home/cahya/Work/flax-community/gpt2-medium-indonesian/wandb/run-20210709_144100-2k1kyrq2/logs/debug-internal.log
6
+ 2021-07-09 14:41:00,272 INFO MainThread:250031 [wandb_init.py:init():370] calling init triggers
7
+ 2021-07-09 14:41:00,273 INFO MainThread:250031 [wandb_init.py:init():375] wandb.init called with sweep_config: {}
8
+ config: {}
9
+ 2021-07-09 14:41:00,273 INFO MainThread:250031 [wandb_init.py:init():419] starting backend
10
+ 2021-07-09 14:41:00,273 INFO MainThread:250031 [backend.py:_multiprocessing_setup():70] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
11
+ 2021-07-09 14:41:00,314 INFO MainThread:250031 [backend.py:ensure_launched():135] starting backend process...
12
+ 2021-07-09 14:41:00,353 INFO MainThread:250031 [backend.py:ensure_launched():139] started backend process with pid: 251111
13
+ 2021-07-09 14:41:00,355 INFO MainThread:250031 [wandb_init.py:init():424] backend started and connected
14
+ 2021-07-09 14:41:00,357 INFO MainThread:250031 [wandb_init.py:init():472] updated telemetry
15
+ 2021-07-09 14:41:00,358 INFO MainThread:250031 [wandb_init.py:init():491] communicating current version
16
+ 2021-07-09 14:41:01,006 INFO MainThread:250031 [wandb_init.py:init():496] got version response
17
+ 2021-07-09 14:41:01,006 INFO MainThread:250031 [wandb_init.py:init():504] communicating run to backend with 30 second timeout
18
+ 2021-07-09 14:41:01,184 INFO MainThread:250031 [wandb_init.py:init():529] starting run threads in backend
19
+ 2021-07-09 14:41:04,780 INFO MainThread:250031 [wandb_run.py:_console_start():1623] atexit reg
20
+ 2021-07-09 14:41:04,781 INFO MainThread:250031 [wandb_run.py:_redirect():1497] redirect: SettingsConsole.REDIRECT
21
+ 2021-07-09 14:41:04,782 INFO MainThread:250031 [wandb_run.py:_redirect():1502] Redirecting console.
22
+ 2021-07-09 14:41:04,783 INFO MainThread:250031 [wandb_run.py:_redirect():1558] Redirects installed.
23
+ 2021-07-09 14:41:04,784 INFO MainThread:250031 [wandb_init.py:init():554] run started, returning control to user process
24
+ 2021-07-09 14:41:04,793 INFO MainThread:250031 [wandb_run.py:_config_callback():872] config_cb None None {'output_dir': '/home/cahya/Work/flax-community/gpt2-medium-indonesian', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'IntervalStrategy.NO', 'prediction_loss_only': False, 'per_device_train_batch_size': 24, 'per_device_eval_batch_size': 24, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'learning_rate': 0.0024, 'weight_decay': 0.01, 'adam_beta1': 0.9, 'adam_beta2': 0.98, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 20.0, 'max_steps': -1, 'lr_scheduler_type': 'SchedulerType.LINEAR', 'warmup_ratio': 0.0, 'warmup_steps': 1000, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': '/home/cahya/Work/flax-community/gpt2-medium-indonesian/runs/Jul09_14-41-04_t1v-n-528d9406-w-0', 'logging_strategy': 'IntervalStrategy.STEPS', 'logging_first_step': False, 'logging_steps': 5000, 'save_strategy': 'IntervalStrategy.STEPS', 'save_steps': 5000, 'save_total_limit': None, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'fp16': False, 'fp16_opt_level': 'O1', 'fp16_backend': 'auto', 'fp16_full_eval': False, 'local_rank': -1, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': 5000, 'dataloader_num_workers': 64, 'past_index': -1, 'run_name': '/home/cahya/Work/flax-community/gpt2-medium-indonesian', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'sharded_ddp': [], 'deepspeed': None, 'label_smoothing_factor': 0.0, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': None, 'push_to_hub_model_id': 'gpt2-medium-indonesian', 'push_to_hub_organization': None, 'push_to_hub_token': None, 'mp_parameters': '', '_n_gpu': 0, '__cached__setup_devices': 'cpu'}
25
+ 2021-07-09 14:41:04,794 INFO MainThread:250031 [wandb_run.py:_config_callback():872] config_cb None None {'model_name_or_path': None, 'model_type': 'gpt2', 'config_name': '/home/cahya/Work/flax-community/gpt2-medium-indonesian', 'tokenizer_name': '/home/cahya/Work/flax-community/gpt2-medium-indonesian', 'cache_dir': None, 'use_fast_tokenizer': True, 'dtype': 'float32'}
26
+ 2021-07-09 14:41:04,794 INFO MainThread:250031 [wandb_run.py:_config_callback():872] config_cb None None {'dataset_name': 'oscar', 'dataset_config_name': 'unshuffled_deduplicated_id', 'train_file': None, 'validation_file': None, 'max_train_samples': None, 'max_eval_samples': None, 'overwrite_cache': False, 'validation_split_percentage': 2, 'block_size': 512, 'preprocessing_num_workers': 64}
27
+ 2021-07-09 14:41:04,795 INFO MainThread:250031 [wandb_config.py:__setitem__():141] config set test_log = 12345 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f3836ca5a90>>
28
+ 2021-07-09 14:41:04,795 INFO MainThread:250031 [wandb_run.py:_config_callback():872] config_cb test_log 12345 None
29
+ 2021-07-09 15:03:23,473 INFO MainThread:250031 [wandb_run.py:_tensorboard_callback():943] tensorboard callback: /home/cahya/Work/flax-community/gpt2-medium-indonesian, None
wandb/run-20210709_144100-2k1kyrq2/run-2k1kyrq2.wandb ADDED
Binary file (1.4 MB). View file