Training in progress, epoch 1

Files changed (4) hide show

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:234b43522056e755c3281687ad40458b1f3b8b220e3f1b0f6627475745075db4
 size 538440512

 version https://git-lfs.github.com/spec/v1
+oid sha256:365cb983ecc64b9ec33ecbce0444bb7d306eb22856312bb5a3d6f8ca6ade0d24
 size 538440512

special_tokens_map.json CHANGED Viewed

@@ -1,37 +1,7 @@
 {
-  "cls_token": {
-    "content": "[CLS]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "mask_token": {
-    "content": "[MASK]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "pad_token": {
-    "content": "[PAD]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "sep_token": {
-    "content": "[SEP]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "unk_token": {
-    "content": "[UNK]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  }
 }

 {
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
 }

tokenizer.json CHANGED Viewed

@@ -4,9 +4,18 @@
     "direction": "Right",
     "max_length": 384,
     "strategy": "OnlySecond",
-    "stride": 128
   },
-  "padding": null,
   "added_tokens": [
     {
       "id": 0,

     "direction": "Right",
     "max_length": 384,
     "strategy": "OnlySecond",
+    "stride": 0
+  },
+  "padding": {
+    "strategy": {
+      "Fixed": 384
+    },
+    "direction": "Right",
+    "pad_to_multiple_of": null,
+    "pad_id": 31,
+    "pad_type_id": 0,
+    "pad_token": "[PAD]"
   },
   "added_tokens": [
     {
       "id": 0,

tokenizer_config.json CHANGED Viewed

@@ -295,7 +295,6 @@
   "do_lower_case": false,
   "mask_token": "[MASK]",
   "max_len": 512,
-  "max_length": 384,
   "model_max_length": 512,
   "never_split": [
     "+ك",
@@ -330,16 +329,10 @@
     "+ات",
     "[رابط]"
   ],
-  "pad_to_multiple_of": null,
   "pad_token": "[PAD]",
-  "pad_token_type_id": 0,
-  "padding_side": "right",
   "sep_token": "[SEP]",
-  "stride": 0,
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
-  "truncation_side": "right",
-  "truncation_strategy": "only_second",
   "unk_token": "[UNK]"
 }

   "do_lower_case": false,
   "mask_token": "[MASK]",
   "max_len": 512,
   "model_max_length": 512,
   "never_split": [
     "+ك",
     "+ات",
     "[رابط]"
   ],
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
   "unk_token": "[UNK]"
 }