Doron Adler committed on
Commit
09936fd
1 Parent(s): 19363c0

Checkpoint 57900

Browse files
Files changed (3) hide show
  1. config.json +2 -1
  2. flax_model.msgpack +1 -1
  3. pytorch_model.bin +2 -2
config.json CHANGED
@@ -40,7 +40,6 @@
40
  ]
41
  ],
42
  "bos_token_id": 50256,
43
- "pad_token_id": 50256,
44
  "embed_dropout": 0,
45
  "eos_token_id": 50256,
46
  "gradient_checkpointing": false,
@@ -52,12 +51,14 @@
52
  "model_type": "gpt_neo",
53
  "num_heads": 16,
54
  "num_layers": 24,
 
55
  "resid_dropout": 0,
56
  "summary_activation": null,
57
  "summary_first_dropout": 0.1,
58
  "summary_proj_to_labels": true,
59
  "summary_type": "cls_index",
60
  "summary_use_proj": true,
 
61
  "transformers_version": "4.9.0.dev0",
62
  "use_cache": true,
63
  "vocab_size": 50257,
 
40
  ]
41
  ],
42
  "bos_token_id": 50256,
 
43
  "embed_dropout": 0,
44
  "eos_token_id": 50256,
45
  "gradient_checkpointing": false,
 
51
  "model_type": "gpt_neo",
52
  "num_heads": 16,
53
  "num_layers": 24,
54
+ "pad_token_id": 50256,
55
  "resid_dropout": 0,
56
  "summary_activation": null,
57
  "summary_first_dropout": 0.1,
58
  "summary_proj_to_labels": true,
59
  "summary_type": "cls_index",
60
  "summary_use_proj": true,
61
+ "torch_dtype": "float32",
62
  "transformers_version": "4.9.0.dev0",
63
  "use_cache": true,
64
  "vocab_size": 50257,
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba645564e45dda013c08946b5814e847188508d452093e072d788c63317acf22
3
  size 5262314590
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57be347ec53e5550d01671a4a120ec5c9aa302452bfb250a6df75eb6ba97c180
3
  size 5262314590
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:236b7d79acdbd44a7d15e0bd2ff1f8a1f1dc51834e73847f0f7590f71373e1c5
3
- size 5312754283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4241205e50ef9c053b7e1c85c69b4911ef33109660db8182280698d50abab1bc
3
+ size 5312753707