Training in progress, step 500
Browse files- .gitignore +1 -0
- config.json +41 -0
- log/1685756631.7457728/events.out.tfevents.1685756631.a4bd701242e7.1463.1 +3 -0
- log/1685756655.802506/events.out.tfevents.1685756655.a4bd701242e7.1463.3 +3 -0
- log/1685756682.4642992/events.out.tfevents.1685756682.a4bd701242e7.1463.5 +3 -0
- log/1685756820.2901652/events.out.tfevents.1685756820.a4bd701242e7.1463.7 +3 -0
- log/1685756968.7793558/events.out.tfevents.1685756968.a4bd701242e7.1463.9 +3 -0
- log/1685757339.4243653/events.out.tfevents.1685757339.a4bd701242e7.1463.11 +3 -0
- log/1685757426.9349952/events.out.tfevents.1685757426.a4bd701242e7.1463.13 +3 -0
- log/1685757599.0818408/events.out.tfevents.1685757599.a4bd701242e7.1463.15 +3 -0
- log/1685757697.210757/events.out.tfevents.1685757697.a4bd701242e7.1463.17 +3 -0
- log/1685757918.260184/events.out.tfevents.1685757918.a4bd701242e7.1463.19 +3 -0
- log/1685758028.454992/events.out.tfevents.1685758028.a4bd701242e7.1463.20 +3 -0
- log/1685758037.5097477/events.out.tfevents.1685758037.a4bd701242e7.1463.22 +3 -0
- log/1685758042.344527/events.out.tfevents.1685758042.a4bd701242e7.1463.23 +3 -0
- log/1685758300.7219527/events.out.tfevents.1685758300.a4bd701242e7.1463.25 +3 -0
- log/1685758440.5740914/events.out.tfevents.1685758440.a4bd701242e7.1463.27 +3 -0
- log/1685762856.0185945/events.out.tfevents.1685762856.a4bd701242e7.1463.29 +3 -0
- log/1685762999.8144422/events.out.tfevents.1685762999.a4bd701242e7.1463.31 +3 -0
- log/1685763165.374101/events.out.tfevents.1685763165.a4bd701242e7.1463.33 +3 -0
- log/events.out.tfevents.1685756631.a4bd701242e7.1463.0 +3 -0
- log/events.out.tfevents.1685756655.a4bd701242e7.1463.2 +3 -0
- log/events.out.tfevents.1685756682.a4bd701242e7.1463.4 +3 -0
- log/events.out.tfevents.1685756820.a4bd701242e7.1463.6 +3 -0
- log/events.out.tfevents.1685756968.a4bd701242e7.1463.8 +3 -0
- log/events.out.tfevents.1685757339.a4bd701242e7.1463.10 +3 -0
- log/events.out.tfevents.1685757426.a4bd701242e7.1463.12 +3 -0
- log/events.out.tfevents.1685757599.a4bd701242e7.1463.14 +3 -0
- log/events.out.tfevents.1685757697.a4bd701242e7.1463.16 +3 -0
- log/events.out.tfevents.1685757918.a4bd701242e7.1463.18 +3 -0
- log/events.out.tfevents.1685758037.a4bd701242e7.1463.21 +3 -0
- log/events.out.tfevents.1685758300.a4bd701242e7.1463.24 +3 -0
- log/events.out.tfevents.1685758440.a4bd701242e7.1463.26 +3 -0
- log/events.out.tfevents.1685762856.a4bd701242e7.1463.28 +3 -0
- log/events.out.tfevents.1685762999.a4bd701242e7.1463.30 +3 -0
- log/events.out.tfevents.1685763165.a4bd701242e7.1463.32 +3 -0
- merges.txt +0 -0
- pytorch_model.bin +3 -0
- special_tokens_map.json +23 -0
- tokenizer_config.json +33 -0
- training_args.bin +3 -0
- vocab.json +0 -0
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "gpt2-medium",
|
3 |
+
"activation_function": "gelu_new",
|
4 |
+
"architectures": [
|
5 |
+
"GPT2LMHeadModel"
|
6 |
+
],
|
7 |
+
"attn_pdrop": 0.1,
|
8 |
+
"bos_token_id": 50256,
|
9 |
+
"embd_pdrop": 0.1,
|
10 |
+
"eos_token_id": 50256,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"layer_norm_epsilon": 1e-05,
|
13 |
+
"model_type": "gpt2",
|
14 |
+
"n_ctx": 1024,
|
15 |
+
"n_embd": 1024,
|
16 |
+
"n_head": 16,
|
17 |
+
"n_inner": null,
|
18 |
+
"n_layer": 24,
|
19 |
+
"n_positions": 1024,
|
20 |
+
"n_special": 0,
|
21 |
+
"predict_special_tokens": true,
|
22 |
+
"reorder_and_upcast_attn": false,
|
23 |
+
"resid_pdrop": 0.1,
|
24 |
+
"scale_attn_by_inverse_layer_idx": false,
|
25 |
+
"scale_attn_weights": true,
|
26 |
+
"summary_activation": null,
|
27 |
+
"summary_first_dropout": 0.1,
|
28 |
+
"summary_proj_to_labels": true,
|
29 |
+
"summary_type": "cls_index",
|
30 |
+
"summary_use_proj": true,
|
31 |
+
"task_specific_params": {
|
32 |
+
"text-generation": {
|
33 |
+
"do_sample": true,
|
34 |
+
"max_length": 50
|
35 |
+
}
|
36 |
+
},
|
37 |
+
"torch_dtype": "float16",
|
38 |
+
"transformers_version": "4.29.2",
|
39 |
+
"use_cache": true,
|
40 |
+
"vocab_size": 50257
|
41 |
+
}
|
log/1685756631.7457728/events.out.tfevents.1685756631.a4bd701242e7.1463.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0a73d5f897136779c4549ac7a2ebaa340f9b5459afc07d3dc0505ae8c9a099d
|
3 |
+
size 5879
|
log/1685756655.802506/events.out.tfevents.1685756655.a4bd701242e7.1463.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf7504ecb232d53ed1485ca976f5fdb2a375146bc010be8ffc2590e1f1fbadd1
|
3 |
+
size 5879
|
log/1685756682.4642992/events.out.tfevents.1685756682.a4bd701242e7.1463.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4812f63b075ff3805ce893828f813a887565cf686209ec0e2ce81525d49a8bd3
|
3 |
+
size 5879
|
log/1685756820.2901652/events.out.tfevents.1685756820.a4bd701242e7.1463.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:484b33a788de078068087ed41388b1b756cefb762e266bf5b25a63c0b967778b
|
3 |
+
size 5879
|
log/1685756968.7793558/events.out.tfevents.1685756968.a4bd701242e7.1463.9
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c673594f716a7e8316b9f2902f2a11ac2ef52da628b1379275add912dfdcd08
|
3 |
+
size 5879
|
log/1685757339.4243653/events.out.tfevents.1685757339.a4bd701242e7.1463.11
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:920be2ceef0c0345bf468fc92d6c9584d80469f6077b2e089dcca58a6656010a
|
3 |
+
size 5879
|
log/1685757426.9349952/events.out.tfevents.1685757426.a4bd701242e7.1463.13
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6dd4c39048cea6cd6c29465f24c89003684021c477166f13ed2ccfc272496d1
|
3 |
+
size 5879
|
log/1685757599.0818408/events.out.tfevents.1685757599.a4bd701242e7.1463.15
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fff3eebd9050636a73a675b66d475625d09156eab320b599f3973baa47803226
|
3 |
+
size 5879
|
log/1685757697.210757/events.out.tfevents.1685757697.a4bd701242e7.1463.17
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6147ecf344b52c74559b6ddadebb81102c436e36b0dfb6d3d0ee8a6f468b57b9
|
3 |
+
size 5879
|
log/1685757918.260184/events.out.tfevents.1685757918.a4bd701242e7.1463.19
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2db3b327f6813c2cbd7ca0abb45a7bfd5b00665f263f7ad509dbe63de9f116bf
|
3 |
+
size 5879
|
log/1685758028.454992/events.out.tfevents.1685758028.a4bd701242e7.1463.20
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d41e3cadad8fce9d4c96e6842cf94ae8e7fde599c3f8baa5843a8e9bf39a58d
|
3 |
+
size 5879
|
log/1685758037.5097477/events.out.tfevents.1685758037.a4bd701242e7.1463.22
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17fdf71d6b145fb81dd4ec1aebd6f1fa095dcc5bf2e8a1bef7cc3b9e3987e497
|
3 |
+
size 5879
|
log/1685758042.344527/events.out.tfevents.1685758042.a4bd701242e7.1463.23
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bb6eca5b956a6831c5ca613b5b9f0da5f8f79321a0ca159accfebcd668e9ba7
|
3 |
+
size 5879
|
log/1685758300.7219527/events.out.tfevents.1685758300.a4bd701242e7.1463.25
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a09d28dd9d67d8bc24686d027e64d2b42498b5eada7aeb701ca0175a9bb3a7b
|
3 |
+
size 5879
|
log/1685758440.5740914/events.out.tfevents.1685758440.a4bd701242e7.1463.27
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d731ecf97991c73be2fc914726dcb228b499e6d06de261e95382f6ae905d240
|
3 |
+
size 5879
|
log/1685762856.0185945/events.out.tfevents.1685762856.a4bd701242e7.1463.29
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cece652662c9393137ff18427abb39dacfd78c25721ceeff16a7a0cf7fc93ac0
|
3 |
+
size 5879
|
log/1685762999.8144422/events.out.tfevents.1685762999.a4bd701242e7.1463.31
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f91ebe5af3723f28bfbdc78f46bd569431cdbe69c43c1442bb6717285687a9a
|
3 |
+
size 5879
|
log/1685763165.374101/events.out.tfevents.1685763165.a4bd701242e7.1463.33
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d0c9a11b3eb1b456696d0b2af395a6b7646c6ec6df12d9482aca7be78884f28
|
3 |
+
size 5875
|
log/events.out.tfevents.1685756631.a4bd701242e7.1463.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65e64886843809c84fd6b59f3628b4b6c8a0fd29c0ca0ddcd03bbb12a783f0ee
|
3 |
+
size 4224
|
log/events.out.tfevents.1685756655.a4bd701242e7.1463.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:819599f7f845d6e65f98458cc6fe112c2dd308b3c3655097f71cedc5ff4ceb36
|
3 |
+
size 4224
|
log/events.out.tfevents.1685756682.a4bd701242e7.1463.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:708a1005dfa8cb26f68fc2b54f5c98a0dfca9dcb51959381318e5cca20b98e8c
|
3 |
+
size 4224
|
log/events.out.tfevents.1685756820.a4bd701242e7.1463.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1619e62a11d0604b6e8b5bffa8748312ac03de1bf1ea2257979c55285966ccf0
|
3 |
+
size 4225
|
log/events.out.tfevents.1685756968.a4bd701242e7.1463.8
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4425fa3c77b774fbbb2080b1c4cc11554f24297c7961b3e91c866c004b7c70b4
|
3 |
+
size 4225
|
log/events.out.tfevents.1685757339.a4bd701242e7.1463.10
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3552ed87d9b4d32bf66dea8cc956722b51f5c0db462c13c0c990479d7b1b21ac
|
3 |
+
size 4225
|
log/events.out.tfevents.1685757426.a4bd701242e7.1463.12
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:386090420fbf2ef4f38715a67450b94eeeb50438dc71d8bda8adf62e7a6ffc4a
|
3 |
+
size 4225
|
log/events.out.tfevents.1685757599.a4bd701242e7.1463.14
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a565fffd1d0ee06961d9e3a4f8539c0755413f5df8f59ae2a7354b8f9e3111f
|
3 |
+
size 4225
|
log/events.out.tfevents.1685757697.a4bd701242e7.1463.16
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af1623784d4e9e9c1bb5fdc05558d9af2bdb24be1948fac458c72b8da151daaf
|
3 |
+
size 4225
|
log/events.out.tfevents.1685757918.a4bd701242e7.1463.18
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12706bb7e31bcd1ecec8d76ebe263ab3cfd0012e3203f8cf220b9c2121d434d5
|
3 |
+
size 8362
|
log/events.out.tfevents.1685758037.a4bd701242e7.1463.21
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45ffc8cdea9bc2b075d30eb617e1db471b1e55b286eaa48eb66edd409b2c995b
|
3 |
+
size 8362
|
log/events.out.tfevents.1685758300.a4bd701242e7.1463.24
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7127328a18c566f2f5bca6f1f33a91e458db7797db3b77bea5e2e25101a059ae
|
3 |
+
size 4225
|
log/events.out.tfevents.1685758440.a4bd701242e7.1463.26
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df1ab1f56a5aa981aa786f5614ac663565aa7ac3cbae8d53807740bd14d0ce9f
|
3 |
+
size 4277
|
log/events.out.tfevents.1685762856.a4bd701242e7.1463.28
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:955eeb4a4d35fbfe966b56cbee304fda2dc22232105df79d93df0084780cdd02
|
3 |
+
size 4277
|
log/events.out.tfevents.1685762999.a4bd701242e7.1463.30
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b24eb0009d463921b2fcf33b3d2ff07b1577d364120c65b36f3844fb1353969
|
3 |
+
size 4277
|
log/events.out.tfevents.1685763165.a4bd701242e7.1463.32
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88ea2471a1d7290589ed2aca9b84ab5bb0085df016684e8720320b30daa6bd05
|
3 |
+
size 5056
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8b742086cb324c2581ecb5db994b4acb98b6f884b8bd0353787e1b5478dcf3a
|
3 |
+
size 734923037
|
special_tokens_map.json
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<|endoftext|>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": true,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "<|endoftext|>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"unk_token": {
|
17 |
+
"content": "<|endoftext|>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": true,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
}
|
23 |
+
}
|
tokenizer_config.json
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": false,
|
3 |
+
"add_prefix_space": false,
|
4 |
+
"bos_token": {
|
5 |
+
"__type": "AddedToken",
|
6 |
+
"content": "<|endoftext|>",
|
7 |
+
"lstrip": false,
|
8 |
+
"normalized": true,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false
|
11 |
+
},
|
12 |
+
"clean_up_tokenization_spaces": true,
|
13 |
+
"eos_token": {
|
14 |
+
"__type": "AddedToken",
|
15 |
+
"content": "<|endoftext|>",
|
16 |
+
"lstrip": false,
|
17 |
+
"normalized": true,
|
18 |
+
"rstrip": false,
|
19 |
+
"single_word": false
|
20 |
+
},
|
21 |
+
"errors": "replace",
|
22 |
+
"model_max_length": 1024,
|
23 |
+
"pad_token": null,
|
24 |
+
"tokenizer_class": "GPT2Tokenizer",
|
25 |
+
"unk_token": {
|
26 |
+
"__type": "AddedToken",
|
27 |
+
"content": "<|endoftext|>",
|
28 |
+
"lstrip": false,
|
29 |
+
"normalized": true,
|
30 |
+
"rstrip": false,
|
31 |
+
"single_word": false
|
32 |
+
}
|
33 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b3bf4d84e11d1fbd4b4cbab1e390ee91ecb66baf3d7702c2f1a1f93455338f4
|
3 |
+
size 3899
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|