pierreguillou
committed on
Commit
•
4e02099
1
Parent(s):
a5ec683
Training in progress, step 10500
Browse files- {checkpoint-9000 → checkpoint-10000}/config.json +0 -0
- {checkpoint-9000 → checkpoint-10000}/optimizer.pt +1 -1
- {checkpoint-9500 → checkpoint-10000}/pytorch_model.bin +1 -1
- {checkpoint-9500 → checkpoint-10000}/rng_state.pth +1 -1
- {checkpoint-9500 → checkpoint-10000}/scaler.pt +1 -1
- {checkpoint-9000 → checkpoint-10000}/scheduler.pt +1 -1
- {checkpoint-9000 → checkpoint-10000}/special_tokens_map.json +0 -0
- {checkpoint-9000 → checkpoint-10000}/tokenizer.json +0 -0
- {checkpoint-9000 → checkpoint-10000}/tokenizer_config.json +0 -0
- {checkpoint-9500 → checkpoint-10000}/trainer_state.json +21 -3
- {checkpoint-9000 → checkpoint-10000}/training_args.bin +0 -0
- {checkpoint-9500 → checkpoint-10500}/config.json +0 -0
- {checkpoint-9500 → checkpoint-10500}/optimizer.pt +1 -1
- {checkpoint-9000 → checkpoint-10500}/pytorch_model.bin +1 -1
- {checkpoint-9000 → checkpoint-10500}/rng_state.pth +1 -1
- {checkpoint-9000 → checkpoint-10500}/scaler.pt +1 -1
- {checkpoint-9500 → checkpoint-10500}/scheduler.pt +1 -1
- {checkpoint-9500 → checkpoint-10500}/special_tokens_map.json +0 -0
- {checkpoint-9500 → checkpoint-10500}/tokenizer.json +0 -0
- {checkpoint-9500 → checkpoint-10500}/tokenizer_config.json +0 -0
- {checkpoint-9000 → checkpoint-10500}/trainer_state.json +57 -3
- {checkpoint-9500 → checkpoint-10500}/training_args.bin +0 -0
- pytorch_model.bin +1 -1
- runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 +2 -2
{checkpoint-9000 → checkpoint-10000}/config.json
RENAMED
File without changes
|
{checkpoint-9000 → checkpoint-10000}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2265828101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d284277e529a50e3e8bb5292a6ded11322ad1fc7a52ec65935b405cb7662695
|
3 |
size 2265828101
|
{checkpoint-9500 → checkpoint-10000}/pytorch_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1134425553
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9cdd3999fd22f100fd94dce143c740e69b3c530d00c63fa0da503c17bada7be
|
3 |
size 1134425553
|
{checkpoint-9500 → checkpoint-10000}/rng_state.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cabb7b3cf7014541a06db66ed776280360aa7ac5090dfa97d8fd96cf3ffc0723
|
3 |
size 14575
|
{checkpoint-9500 → checkpoint-10000}/scaler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 557
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33042e23a1c163afce06998300e1af98d04bb036d7a9fc004dc4fc5115c37477
|
3 |
size 557
|
{checkpoint-9000 → checkpoint-10000}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c34c3aa5eb00aba6650e668fcf350c18b296ed27ff6b939de04b85351858f303
|
3 |
size 627
|
{checkpoint-9000 → checkpoint-10000}/special_tokens_map.json
RENAMED
File without changes
|
{checkpoint-9000 → checkpoint-10000}/tokenizer.json
RENAMED
File without changes
|
{checkpoint-9000 → checkpoint-10000}/tokenizer_config.json
RENAMED
File without changes
|
{checkpoint-9500 → checkpoint-10000}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": 0.8849383152916955,
|
3 |
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -348,11 +348,29 @@
|
|
348 |
"eval_samples_per_second": 60.557,
|
349 |
"eval_steps_per_second": 3.807,
|
350 |
"step": 9500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
351 |
}
|
352 |
],
|
353 |
"max_steps": 12035,
|
354 |
"num_train_epochs": 5,
|
355 |
-
"total_flos": 1.
|
356 |
"trial_name": null,
|
357 |
"trial_params": null
|
358 |
}
|
|
|
1 |
{
|
2 |
"best_metric": 0.8849383152916955,
|
3 |
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
|
4 |
+
"epoch": 4.154549231408392,
|
5 |
+
"global_step": 10000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
348 |
"eval_samples_per_second": 60.557,
|
349 |
"eval_steps_per_second": 3.807,
|
350 |
"step": 9500
|
351 |
+
},
|
352 |
+
{
|
353 |
+
"epoch": 4.15,
|
354 |
+
"learning_rate": 8.483589530535937e-06,
|
355 |
+
"loss": 0.0464,
|
356 |
+
"step": 10000
|
357 |
+
},
|
358 |
+
{
|
359 |
+
"epoch": 4.15,
|
360 |
+
"eval_accuracy": 0.8510961702401442,
|
361 |
+
"eval_f1": 0.8510961702401442,
|
362 |
+
"eval_loss": 1.0767754316329956,
|
363 |
+
"eval_precision": 0.8510961702401442,
|
364 |
+
"eval_recall": 0.8510961702401442,
|
365 |
+
"eval_runtime": 38.7314,
|
366 |
+
"eval_samples_per_second": 52.98,
|
367 |
+
"eval_steps_per_second": 3.331,
|
368 |
+
"step": 10000
|
369 |
}
|
370 |
],
|
371 |
"max_steps": 12035,
|
372 |
"num_train_epochs": 5,
|
373 |
+
"total_flos": 1.6684492713864192e+16,
|
374 |
"trial_name": null,
|
375 |
"trial_params": null
|
376 |
}
|
{checkpoint-9000 → checkpoint-10000}/training_args.bin
RENAMED
File without changes
|
{checkpoint-9500 → checkpoint-10500}/config.json
RENAMED
File without changes
|
{checkpoint-9500 → checkpoint-10500}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2265828101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f73f8178eb8edf00ed5b572bab08ed8dc9a6b9f127b9da0845ce6897121f30d4
|
3 |
size 2265828101
|
{checkpoint-9000 → checkpoint-10500}/pytorch_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1134425553
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ded9cb2eeea21506721e8c61ffb8b582933f1daa41565103186b7c1e36b4c34
|
3 |
size 1134425553
|
{checkpoint-9000 → checkpoint-10500}/rng_state.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71d4bb3c3265e07b1b570a635f165856008288f9ef44970f54c27bda7a78510a
|
3 |
size 14575
|
{checkpoint-9000 → checkpoint-10500}/scaler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 557
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0189e6a21dbc7825032487f150c86eee8abb079d598cf29704ea468feba66754
|
3 |
size 557
|
{checkpoint-9500 → checkpoint-10500}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bc651b3c4e5c2b5a130baba8a17171ec720b664d0099fc5a91625bbe706a9d8
|
3 |
size 627
|
{checkpoint-9500 → checkpoint-10500}/special_tokens_map.json
RENAMED
File without changes
|
{checkpoint-9500 → checkpoint-10500}/tokenizer.json
RENAMED
File without changes
|
{checkpoint-9500 → checkpoint-10500}/tokenizer_config.json
RENAMED
File without changes
|
{checkpoint-9000 → checkpoint-10500}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": 0.8849383152916955,
|
3 |
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -330,11 +330,65 @@
|
|
330 |
"eval_samples_per_second": 51.672,
|
331 |
"eval_steps_per_second": 3.248,
|
332 |
"step": 9000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
333 |
}
|
334 |
],
|
335 |
"max_steps": 12035,
|
336 |
"num_train_epochs": 5,
|
337 |
-
"total_flos": 1.
|
338 |
"trial_name": null,
|
339 |
"trial_params": null
|
340 |
}
|
|
|
1 |
{
|
2 |
"best_metric": 0.8849383152916955,
|
3 |
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
|
4 |
+
"epoch": 4.362276692978812,
|
5 |
+
"global_step": 10500,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
330 |
"eval_samples_per_second": 51.672,
|
331 |
"eval_steps_per_second": 3.248,
|
332 |
"step": 9000
|
333 |
+
},
|
334 |
+
{
|
335 |
+
"epoch": 3.95,
|
336 |
+
"learning_rate": 1.0560864146240134e-05,
|
337 |
+
"loss": 0.0639,
|
338 |
+
"step": 9500
|
339 |
+
},
|
340 |
+
{
|
341 |
+
"epoch": 3.95,
|
342 |
+
"eval_accuracy": 0.8585272876421483,
|
343 |
+
"eval_f1": 0.8585272876421483,
|
344 |
+
"eval_loss": 0.9562506079673767,
|
345 |
+
"eval_precision": 0.8585272876421483,
|
346 |
+
"eval_recall": 0.8585272876421483,
|
347 |
+
"eval_runtime": 33.8854,
|
348 |
+
"eval_samples_per_second": 60.557,
|
349 |
+
"eval_steps_per_second": 3.807,
|
350 |
+
"step": 9500
|
351 |
+
},
|
352 |
+
{
|
353 |
+
"epoch": 4.15,
|
354 |
+
"learning_rate": 8.483589530535937e-06,
|
355 |
+
"loss": 0.0464,
|
356 |
+
"step": 10000
|
357 |
+
},
|
358 |
+
{
|
359 |
+
"epoch": 4.15,
|
360 |
+
"eval_accuracy": 0.8510961702401442,
|
361 |
+
"eval_f1": 0.8510961702401442,
|
362 |
+
"eval_loss": 1.0767754316329956,
|
363 |
+
"eval_precision": 0.8510961702401442,
|
364 |
+
"eval_recall": 0.8510961702401442,
|
365 |
+
"eval_runtime": 38.7314,
|
366 |
+
"eval_samples_per_second": 52.98,
|
367 |
+
"eval_steps_per_second": 3.331,
|
368 |
+
"step": 10000
|
369 |
+
},
|
370 |
+
{
|
371 |
+
"epoch": 4.36,
|
372 |
+
"learning_rate": 6.406314914831742e-06,
|
373 |
+
"loss": 0.0412,
|
374 |
+
"step": 10500
|
375 |
+
},
|
376 |
+
{
|
377 |
+
"epoch": 4.36,
|
378 |
+
"eval_accuracy": 0.8439143652185103,
|
379 |
+
"eval_f1": 0.8439143652185103,
|
380 |
+
"eval_loss": 1.1184284687042236,
|
381 |
+
"eval_precision": 0.8439143652185103,
|
382 |
+
"eval_recall": 0.8439143652185103,
|
383 |
+
"eval_runtime": 34.8108,
|
384 |
+
"eval_samples_per_second": 58.947,
|
385 |
+
"eval_steps_per_second": 3.706,
|
386 |
+
"step": 10500
|
387 |
}
|
388 |
],
|
389 |
"max_steps": 12035,
|
390 |
"num_train_epochs": 5,
|
391 |
+
"total_flos": 1.7519009430408192e+16,
|
392 |
"trial_name": null,
|
393 |
"trial_params": null
|
394 |
}
|
{checkpoint-9500 → checkpoint-10500}/training_args.bin
RENAMED
File without changes
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1134425553
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ded9cb2eeea21506721e8c61ffb8b582933f1daa41565103186b7c1e36b4c34
|
3 |
size 1134425553
|
runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd243e364357934c6c9869396572a0adcc90607302d0df94af11534a3f187cd2
|
3 |
+
size 17838
|