burakaytan committed on
Commit
15b8dea
1 Parent(s): ed5a1c3

Upload 8 files

Browse files
Files changed (8) hide show
  1. config.json +26 -0
  2. merges.txt +0 -0
  3. optimizer.pt +3 -0
  4. pytorch_model.bin +3 -0
  5. rng_state.pth +3 -0
  6. scheduler.pt +3 -0
  7. training_args.bin +3 -0
  8. vocab.json +0 -0
config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "RobertaTurkish",
3
+ "architectures": [
4
+ "RobertaForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "eos_token_id": 2,
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 3072,
15
+ "layer_norm_eps": 1e-05,
16
+ "max_position_embeddings": 514,
17
+ "model_type": "roberta",
18
+ "num_attention_heads": 12,
19
+ "num_hidden_layers": 12,
20
+ "pad_token_id": 1,
21
+ "position_embedding_type": "absolute",
22
+ "transformers_version": "4.8.2",
23
+ "type_vocab_size": 1,
24
+ "use_cache": true,
25
+ "vocab_size": 50265
26
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7149cc232fbc327fa61c6bdf6d7e23a5d880cf826e1f0064df13a13dccf0c6e0
3
+ size 997706595
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1313f2f46b3272303a77391a4a2007332019ba429177f0c2f12892ce8f4a9a5
3
+ size 498880850
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:241f53343ed7ff64a02ed3435cc351a74dc3b0e0208ba1bcb5b3cfa7c6269fb9
3
+ size 15690
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16b7e5a8249bb1ccc0c9fd2f2f489177411be13a6166921d4d6d3e5a1e5c3565
3
+ size 623
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56de9374b3077bddd600535696f675040aae308ad9c2dea86421d2ce409119db
3
+ size 2607
vocab.json ADDED
The diff for this file is too large to render. See raw diff