helezabi committed on
Commit
ef5152a
·
1 Parent(s): cf66490

Training in progress, step 500

Browse files
Files changed (42) hide show
  1. .gitignore +1 -0
  2. config.json +41 -0
  3. log/1685756631.7457728/events.out.tfevents.1685756631.a4bd701242e7.1463.1 +3 -0
  4. log/1685756655.802506/events.out.tfevents.1685756655.a4bd701242e7.1463.3 +3 -0
  5. log/1685756682.4642992/events.out.tfevents.1685756682.a4bd701242e7.1463.5 +3 -0
  6. log/1685756820.2901652/events.out.tfevents.1685756820.a4bd701242e7.1463.7 +3 -0
  7. log/1685756968.7793558/events.out.tfevents.1685756968.a4bd701242e7.1463.9 +3 -0
  8. log/1685757339.4243653/events.out.tfevents.1685757339.a4bd701242e7.1463.11 +3 -0
  9. log/1685757426.9349952/events.out.tfevents.1685757426.a4bd701242e7.1463.13 +3 -0
  10. log/1685757599.0818408/events.out.tfevents.1685757599.a4bd701242e7.1463.15 +3 -0
  11. log/1685757697.210757/events.out.tfevents.1685757697.a4bd701242e7.1463.17 +3 -0
  12. log/1685757918.260184/events.out.tfevents.1685757918.a4bd701242e7.1463.19 +3 -0
  13. log/1685758028.454992/events.out.tfevents.1685758028.a4bd701242e7.1463.20 +3 -0
  14. log/1685758037.5097477/events.out.tfevents.1685758037.a4bd701242e7.1463.22 +3 -0
  15. log/1685758042.344527/events.out.tfevents.1685758042.a4bd701242e7.1463.23 +3 -0
  16. log/1685758300.7219527/events.out.tfevents.1685758300.a4bd701242e7.1463.25 +3 -0
  17. log/1685758440.5740914/events.out.tfevents.1685758440.a4bd701242e7.1463.27 +3 -0
  18. log/1685762856.0185945/events.out.tfevents.1685762856.a4bd701242e7.1463.29 +3 -0
  19. log/1685762999.8144422/events.out.tfevents.1685762999.a4bd701242e7.1463.31 +3 -0
  20. log/1685763165.374101/events.out.tfevents.1685763165.a4bd701242e7.1463.33 +3 -0
  21. log/events.out.tfevents.1685756631.a4bd701242e7.1463.0 +3 -0
  22. log/events.out.tfevents.1685756655.a4bd701242e7.1463.2 +3 -0
  23. log/events.out.tfevents.1685756682.a4bd701242e7.1463.4 +3 -0
  24. log/events.out.tfevents.1685756820.a4bd701242e7.1463.6 +3 -0
  25. log/events.out.tfevents.1685756968.a4bd701242e7.1463.8 +3 -0
  26. log/events.out.tfevents.1685757339.a4bd701242e7.1463.10 +3 -0
  27. log/events.out.tfevents.1685757426.a4bd701242e7.1463.12 +3 -0
  28. log/events.out.tfevents.1685757599.a4bd701242e7.1463.14 +3 -0
  29. log/events.out.tfevents.1685757697.a4bd701242e7.1463.16 +3 -0
  30. log/events.out.tfevents.1685757918.a4bd701242e7.1463.18 +3 -0
  31. log/events.out.tfevents.1685758037.a4bd701242e7.1463.21 +3 -0
  32. log/events.out.tfevents.1685758300.a4bd701242e7.1463.24 +3 -0
  33. log/events.out.tfevents.1685758440.a4bd701242e7.1463.26 +3 -0
  34. log/events.out.tfevents.1685762856.a4bd701242e7.1463.28 +3 -0
  35. log/events.out.tfevents.1685762999.a4bd701242e7.1463.30 +3 -0
  36. log/events.out.tfevents.1685763165.a4bd701242e7.1463.32 +3 -0
  37. merges.txt +0 -0
  38. pytorch_model.bin +3 -0
  39. special_tokens_map.json +23 -0
  40. tokenizer_config.json +33 -0
  41. training_args.bin +3 -0
  42. vocab.json +0 -0
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "gpt2-medium",
3
+ "activation_function": "gelu_new",
4
+ "architectures": [
5
+ "GPT2LMHeadModel"
6
+ ],
7
+ "attn_pdrop": 0.1,
8
+ "bos_token_id": 50256,
9
+ "embd_pdrop": 0.1,
10
+ "eos_token_id": 50256,
11
+ "initializer_range": 0.02,
12
+ "layer_norm_epsilon": 1e-05,
13
+ "model_type": "gpt2",
14
+ "n_ctx": 1024,
15
+ "n_embd": 1024,
16
+ "n_head": 16,
17
+ "n_inner": null,
18
+ "n_layer": 24,
19
+ "n_positions": 1024,
20
+ "n_special": 0,
21
+ "predict_special_tokens": true,
22
+ "reorder_and_upcast_attn": false,
23
+ "resid_pdrop": 0.1,
24
+ "scale_attn_by_inverse_layer_idx": false,
25
+ "scale_attn_weights": true,
26
+ "summary_activation": null,
27
+ "summary_first_dropout": 0.1,
28
+ "summary_proj_to_labels": true,
29
+ "summary_type": "cls_index",
30
+ "summary_use_proj": true,
31
+ "task_specific_params": {
32
+ "text-generation": {
33
+ "do_sample": true,
34
+ "max_length": 50
35
+ }
36
+ },
37
+ "torch_dtype": "float16",
38
+ "transformers_version": "4.29.2",
39
+ "use_cache": true,
40
+ "vocab_size": 50257
41
+ }
log/1685756631.7457728/events.out.tfevents.1685756631.a4bd701242e7.1463.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0a73d5f897136779c4549ac7a2ebaa340f9b5459afc07d3dc0505ae8c9a099d
3
+ size 5879
log/1685756655.802506/events.out.tfevents.1685756655.a4bd701242e7.1463.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf7504ecb232d53ed1485ca976f5fdb2a375146bc010be8ffc2590e1f1fbadd1
3
+ size 5879
log/1685756682.4642992/events.out.tfevents.1685756682.a4bd701242e7.1463.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4812f63b075ff3805ce893828f813a887565cf686209ec0e2ce81525d49a8bd3
3
+ size 5879
log/1685756820.2901652/events.out.tfevents.1685756820.a4bd701242e7.1463.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:484b33a788de078068087ed41388b1b756cefb762e266bf5b25a63c0b967778b
3
+ size 5879
log/1685756968.7793558/events.out.tfevents.1685756968.a4bd701242e7.1463.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c673594f716a7e8316b9f2902f2a11ac2ef52da628b1379275add912dfdcd08
3
+ size 5879
log/1685757339.4243653/events.out.tfevents.1685757339.a4bd701242e7.1463.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:920be2ceef0c0345bf468fc92d6c9584d80469f6077b2e089dcca58a6656010a
3
+ size 5879
log/1685757426.9349952/events.out.tfevents.1685757426.a4bd701242e7.1463.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6dd4c39048cea6cd6c29465f24c89003684021c477166f13ed2ccfc272496d1
3
+ size 5879
log/1685757599.0818408/events.out.tfevents.1685757599.a4bd701242e7.1463.15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fff3eebd9050636a73a675b66d475625d09156eab320b599f3973baa47803226
3
+ size 5879
log/1685757697.210757/events.out.tfevents.1685757697.a4bd701242e7.1463.17 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6147ecf344b52c74559b6ddadebb81102c436e36b0dfb6d3d0ee8a6f468b57b9
3
+ size 5879
log/1685757918.260184/events.out.tfevents.1685757918.a4bd701242e7.1463.19 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2db3b327f6813c2cbd7ca0abb45a7bfd5b00665f263f7ad509dbe63de9f116bf
3
+ size 5879
log/1685758028.454992/events.out.tfevents.1685758028.a4bd701242e7.1463.20 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d41e3cadad8fce9d4c96e6842cf94ae8e7fde599c3f8baa5843a8e9bf39a58d
3
+ size 5879
log/1685758037.5097477/events.out.tfevents.1685758037.a4bd701242e7.1463.22 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17fdf71d6b145fb81dd4ec1aebd6f1fa095dcc5bf2e8a1bef7cc3b9e3987e497
3
+ size 5879
log/1685758042.344527/events.out.tfevents.1685758042.a4bd701242e7.1463.23 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bb6eca5b956a6831c5ca613b5b9f0da5f8f79321a0ca159accfebcd668e9ba7
3
+ size 5879
log/1685758300.7219527/events.out.tfevents.1685758300.a4bd701242e7.1463.25 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a09d28dd9d67d8bc24686d027e64d2b42498b5eada7aeb701ca0175a9bb3a7b
3
+ size 5879
log/1685758440.5740914/events.out.tfevents.1685758440.a4bd701242e7.1463.27 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d731ecf97991c73be2fc914726dcb228b499e6d06de261e95382f6ae905d240
3
+ size 5879
log/1685762856.0185945/events.out.tfevents.1685762856.a4bd701242e7.1463.29 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cece652662c9393137ff18427abb39dacfd78c25721ceeff16a7a0cf7fc93ac0
3
+ size 5879
log/1685762999.8144422/events.out.tfevents.1685762999.a4bd701242e7.1463.31 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f91ebe5af3723f28bfbdc78f46bd569431cdbe69c43c1442bb6717285687a9a
3
+ size 5879
log/1685763165.374101/events.out.tfevents.1685763165.a4bd701242e7.1463.33 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d0c9a11b3eb1b456696d0b2af395a6b7646c6ec6df12d9482aca7be78884f28
3
+ size 5875
log/events.out.tfevents.1685756631.a4bd701242e7.1463.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65e64886843809c84fd6b59f3628b4b6c8a0fd29c0ca0ddcd03bbb12a783f0ee
3
+ size 4224
log/events.out.tfevents.1685756655.a4bd701242e7.1463.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:819599f7f845d6e65f98458cc6fe112c2dd308b3c3655097f71cedc5ff4ceb36
3
+ size 4224
log/events.out.tfevents.1685756682.a4bd701242e7.1463.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:708a1005dfa8cb26f68fc2b54f5c98a0dfca9dcb51959381318e5cca20b98e8c
3
+ size 4224
log/events.out.tfevents.1685756820.a4bd701242e7.1463.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1619e62a11d0604b6e8b5bffa8748312ac03de1bf1ea2257979c55285966ccf0
3
+ size 4225
log/events.out.tfevents.1685756968.a4bd701242e7.1463.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4425fa3c77b774fbbb2080b1c4cc11554f24297c7961b3e91c866c004b7c70b4
3
+ size 4225
log/events.out.tfevents.1685757339.a4bd701242e7.1463.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3552ed87d9b4d32bf66dea8cc956722b51f5c0db462c13c0c990479d7b1b21ac
3
+ size 4225
log/events.out.tfevents.1685757426.a4bd701242e7.1463.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:386090420fbf2ef4f38715a67450b94eeeb50438dc71d8bda8adf62e7a6ffc4a
3
+ size 4225
log/events.out.tfevents.1685757599.a4bd701242e7.1463.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a565fffd1d0ee06961d9e3a4f8539c0755413f5df8f59ae2a7354b8f9e3111f
3
+ size 4225
log/events.out.tfevents.1685757697.a4bd701242e7.1463.16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af1623784d4e9e9c1bb5fdc05558d9af2bdb24be1948fac458c72b8da151daaf
3
+ size 4225
log/events.out.tfevents.1685757918.a4bd701242e7.1463.18 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12706bb7e31bcd1ecec8d76ebe263ab3cfd0012e3203f8cf220b9c2121d434d5
3
+ size 8362
log/events.out.tfevents.1685758037.a4bd701242e7.1463.21 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45ffc8cdea9bc2b075d30eb617e1db471b1e55b286eaa48eb66edd409b2c995b
3
+ size 8362
log/events.out.tfevents.1685758300.a4bd701242e7.1463.24 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7127328a18c566f2f5bca6f1f33a91e458db7797db3b77bea5e2e25101a059ae
3
+ size 4225
log/events.out.tfevents.1685758440.a4bd701242e7.1463.26 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df1ab1f56a5aa981aa786f5614ac663565aa7ac3cbae8d53807740bd14d0ce9f
3
+ size 4277
log/events.out.tfevents.1685762856.a4bd701242e7.1463.28 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:955eeb4a4d35fbfe966b56cbee304fda2dc22232105df79d93df0084780cdd02
3
+ size 4277
log/events.out.tfevents.1685762999.a4bd701242e7.1463.30 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b24eb0009d463921b2fcf33b3d2ff07b1577d364120c65b36f3844fb1353969
3
+ size 4277
log/events.out.tfevents.1685763165.a4bd701242e7.1463.32 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88ea2471a1d7290589ed2aca9b84ab5bb0085df016684e8720320b30daa6bd05
3
+ size 5056
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8b742086cb324c2581ecb5db994b4acb98b6f884b8bd0353787e1b5478dcf3a
3
+ size 734923037
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|endoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "unk_token": {
17
+ "content": "<|endoftext|>",
18
+ "lstrip": false,
19
+ "normalized": true,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": false,
3
+ "add_prefix_space": false,
4
+ "bos_token": {
5
+ "__type": "AddedToken",
6
+ "content": "<|endoftext|>",
7
+ "lstrip": false,
8
+ "normalized": true,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "clean_up_tokenization_spaces": true,
13
+ "eos_token": {
14
+ "__type": "AddedToken",
15
+ "content": "<|endoftext|>",
16
+ "lstrip": false,
17
+ "normalized": true,
18
+ "rstrip": false,
19
+ "single_word": false
20
+ },
21
+ "errors": "replace",
22
+ "model_max_length": 1024,
23
+ "pad_token": null,
24
+ "tokenizer_class": "GPT2Tokenizer",
25
+ "unk_token": {
26
+ "__type": "AddedToken",
27
+ "content": "<|endoftext|>",
28
+ "lstrip": false,
29
+ "normalized": true,
30
+ "rstrip": false,
31
+ "single_word": false
32
+ }
33
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b3bf4d84e11d1fbd4b4cbab1e390ee91ecb66baf3d7702c2f1a1f93455338f4
3
+ size 3899
vocab.json ADDED
The diff for this file is too large to render. See raw diff