Training in progress, step 500

Files changed (14) hide show

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ checkpoint-*/

config.json ADDED Viewed

+{
+  "_name_or_path": "EleutherAI/gpt-neo-125M",
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPTNeoForCausalLM"
+  ],
+  "attention_dropout": 0,
+  "attention_layers": [
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local"
+  ],
+  "attention_types": [
+    [
+      [
+        "global",
+        "local"
+      ],
+      6
+    ]
+  ],
+  "bos_token_id": 50256,
+  "embed_dropout": 0,
+  "eos_token_id": 50256,
+  "gradient_checkpointing": false,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": null,
+  "layer_norm_epsilon": 1e-05,
+  "max_position_embeddings": 2048,
+  "model_type": "gpt_neo",
+  "num_heads": 12,
+  "num_layers": 12,
+  "resid_dropout": 0,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.28.0",
+  "use_cache": true,
+  "vocab_size": 50257,
+  "window_size": 256
+}

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:835b18caaa5c65da5aac10393ba95b85665dba1339f307378690783a2b2f9fb7
+size 551186797

runs/Jun02_18-08-45_9956507f5fb8/1685729398.4258645/events.out.tfevents.1685729398.9956507f5fb8.4209.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:be7b9d5037deb69ec17a586f88d3c4442ddf7119f848f5564107647b6586b49e
+size 5891

runs/Jun02_18-08-45_9956507f5fb8/events.out.tfevents.1685729398.9956507f5fb8.4209.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a2a6d00d134a9cfdf76a13ef031fdd87ee0a93748f55b3dd595f1939c3025d9
+size 4414

runs/Jun02_18-12-25_9956507f5fb8/1685729553.227646/events.out.tfevents.1685729553.9956507f5fb8.4209.3 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:dbd1b4b11d606311f22ebbeaf2314d975edb866b4347cfba3c76b7fffaaf3e9f
+size 5891

runs/Jun02_18-12-25_9956507f5fb8/1685729613.9848425/events.out.tfevents.1685729613.9956507f5fb8.4209.5 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:cce5713fdabea8a40996dbc978b034196a59eeba03ee2ad9100527a3344c67e6
+size 5891

runs/Jun02_18-12-25_9956507f5fb8/events.out.tfevents.1685729553.9956507f5fb8.4209.2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c89f15df40c5a443de6f9d6710b3ca613ac8de16fadfb19a43e3db51194bec18
+size 4414

runs/Jun02_18-12-25_9956507f5fb8/events.out.tfevents.1685729613.9956507f5fb8.4209.4 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c574c70d1ea1e7c1086c50d871d155f328ae13079d98f3c57e43a522395a13a5
+size 4571

special_tokens_map.json ADDED Viewed

+{
+  "bos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<|endoftext|>",
+  "unk_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer_config.json ADDED Viewed

+{
+  "add_bos_token": false,
+  "add_prefix_space": false,
+  "bos_token": {
+    "__type": "AddedToken",
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "clean_up_tokenization_spaces": true,
+  "eos_token": {
+    "__type": "AddedToken",
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "errors": "replace",
+  "model_max_length": 2048,
+  "pad_token": null,
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": {
+    "__type": "AddedToken",
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}

training_args.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6d3b7f819123cb8deba2adc00086741e552fc8aa4f3e13074577fa7c0f534206
+size 3579

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff