WhiteAngelss
/

bert-base-turkish-cased

Text Classification

Inference Endpoints

Model card · Files and versions · Community

WhiteAngels committed on Jul 25, 2024

Commit

f7f2bcd

·

verified ·

1 Parent(s): ce691b9

Update tokenizer_config.json

Files changed (1) hide show

tokenizer_config.json +19 -1

tokenizer_config.json CHANGED Viewed

@@ -23,16 +23,34 @@
       "rstrip": false,
       "single_word": false,
       "special": true
   },
   "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
   "do_basic_tokenize": true,
   "do_lower_case": true,
   "max_len": 512,
   "model_max_length": 512,
   "never_split": null,
   "pad_token": "[PAD]",
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",

       "rstrip": false,
       "single_word": false,
       "special": true
+    },
+    "3": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
   },
   "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
   "do_basic_tokenize": true,
   "do_lower_case": true,
+  "mask_token": "[MASK]",
   "max_len": 512,
   "model_max_length": 512,
   "never_split": null,
   "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",