Training in progress, epoch 0

Browse files

Files changed (5) hide show

added_tokens.json +7 -0
config.json +8 -8
pytorch_model.bin +2 -2
tokenizer_config.json +51 -0
training_args.bin +2 -2

added_tokens.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "[CLS]": 2,
+  "[MASK]": 4,
+  "[PAD]": 0,
+  "[SEP]": 3,
+  "[UNK]": 1
+}

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "aubmindlab/bert-large-arabertv02-twitter",
   "architectures": [
     "BertForSequenceClassification"
   ],
@@ -10,16 +10,16 @@
   "hidden_dropout_prob": 0.1,
   "hidden_size": 1024,
   "id2label": {
-    "0": "request",
-    "1": "complaint",
-    "2": "satisfaction"
   },
   "initializer_range": 0.02,
   "intermediate_size": 4096,
   "label2id": {
-    "complaint": 1,
-    "request": 0,
-    "satisfaction": 2
   },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
@@ -30,7 +30,7 @@
   "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "torch_dtype": "float32",
-  "transformers_version": "4.30.1",
   "type_vocab_size": 2,
   "use_cache": true,
   "vocab_size": 64000

 {
+  "_name_or_path": "Yousefmd/arabert-sentiment-classification",
   "architectures": [
     "BertForSequenceClassification"
   ],
   "hidden_dropout_prob": 0.1,
   "hidden_size": 1024,
   "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2"
   },
   "initializer_range": 0.02,
   "intermediate_size": 4096,
   "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2
   },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "torch_dtype": "float32",
+  "transformers_version": "4.34.0",
   "type_vocab_size": 2,
   "use_cache": true,
   "vocab_size": 64000

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:74ca9e2492bdeae5fe20e1154640fbc39f0ced5e5de51cbf8bdbd05bdb7c993f
-size 1477844597

 version https://git-lfs.github.com/spec/v1
+oid sha256:2e922460ab2ed766fe340927ef23130b3886f9792f23b6dcca82649b9ccb3073
+size 1477840177

tokenizer_config.json CHANGED Viewed

@@ -1,21 +1,72 @@
 {
   "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
   "do_basic_tokenize": true,
   "do_lower_case": false,
   "mask_token": "[MASK]",
   "max_len": 512,
   "model_max_length": 512,
   "never_split": [
     "[بريد]",
     "[مستخدم]",
     "[رابط]"
   ],
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
   "unk_token": "[UNK]",
   "use_fast": true
 }

 {
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [],
   "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
   "do_basic_tokenize": true,
   "do_lower_case": false,
+  "ignore_mismatched_sizes": true,
   "mask_token": "[MASK]",
   "max_len": 512,
+  "max_length": 128,
   "model_max_length": 512,
   "never_split": [
     "[بريد]",
     "[مستخدم]",
     "[رابط]"
   ],
+  "pad_to_multiple_of": null,
   "pad_token": "[PAD]",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
   "sep_token": "[SEP]",
+  "stride": 0,
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
   "unk_token": "[UNK]",
   "use_fast": true
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:15b276cad04a08b5726b113ede2970a0bd785db37346244d5ce122f33977325b
-size 3963

 version https://git-lfs.github.com/spec/v1
+oid sha256:fd4249ad5df8a68beaf61239ec0ca1b090169b797dc398439f233985546bd9e5
+size 4091