typeof
/

all-MiniLM-L6-v2-decoder

Text Generation

Inference Endpoints

Model card Files Files and versions Community

typeof committed on Jun 15, 2024

Commit

62fd940

·

1 Parent(s): ae303c9

init

Files changed (1) hide show

tokenizer.json +1 -76

tokenizer.json CHANGED Viewed

@@ -59,81 +59,6 @@
   "pre_tokenizer": {
     "type": "BertPreTokenizer"
   },
-  "post_processor": {
-    "type": "TemplateProcessing",
-    "single": [
-      {
-        "SpecialToken": {
-          "id": "[CLS]",
-          "type_id": 0
-        }
-      },
-      {
-        "Sequence": {
-          "id": "A",
-          "type_id": 0
-        }
-      },
-      {
-        "SpecialToken": {
-          "id": "[SEP]",
-          "type_id": 0
-        }
-      }
-    ],
-    "pair": [
-      {
-        "SpecialToken": {
-          "id": "[CLS]",
-          "type_id": 0
-        }
-      },
-      {
-        "Sequence": {
-          "id": "A",
-          "type_id": 0
-        }
-      },
-      {
-        "SpecialToken": {
-          "id": "[SEP]",
-          "type_id": 0
-        }
-      },
-      {
-        "Sequence": {
-          "id": "B",
-          "type_id": 1
-        }
-      },
-      {
-        "SpecialToken": {
-          "id": "[SEP]",
-          "type_id": 1
-        }
-      }
-    ],
-    "special_tokens": {
-      "[CLS]": {
-        "id": "[CLS]",
-        "ids": [
-          101
-        ],
-        "tokens": [
-          "[CLS]"
-        ]
-      },
-      "[SEP]": {
-        "id": "[SEP]",
-        "ids": [
-          102
-        ],
-        "tokens": [
-          "[SEP]"
-        ]
-      }
-    }
-  },
   "decoder": {
     "type": "WordPiece",
     "prefix": "##",
@@ -146,7 +71,7 @@
     "max_input_chars_per_word": 100,
     "vocab": {
       "[PAD]": 0,
-      "[unused0]": 1,
       "[unused1]": 2,
       "[unused2]": 3,
       "[unused3]": 4,

   "pre_tokenizer": {
     "type": "BertPreTokenizer"
   },
   "decoder": {
     "type": "WordPiece",
     "prefix": "##",
     "max_input_chars_per_word": 100,
     "vocab": {
       "[PAD]": 0,
+      "[EOS]": 1,
       "[unused1]": 2,
       "[unused2]": 3,
       "[unused3]": 4,