Vishnou
/

distilbert_base_SST2

Text Classification

Generated from Trainer

Inference Endpoints

Model card Files and versions Community

Vishnou committed on Nov 18, 2023

Commit

b108c04

·

1 Parent(s): 240862b

Upload tokenizer

Files changed (2) hide show

tokenizer.json +16 -2
tokenizer_config.json +0 -2

tokenizer.json CHANGED Viewed

@@ -1,7 +1,21 @@
 {
   "version": "1.0",
-  "truncation": null,
-  "padding": null,
   "added_tokens": [
     {
       "id": 0,

 {
   "version": "1.0",
+  "truncation": {
+    "direction": "Right",
+    "max_length": 65,
+    "strategy": "LongestFirst",
+    "stride": 0
+  },
+  "padding": {
+    "strategy": {
+      "Fixed": 65
+    },
+    "direction": "Right",
+    "pad_to_multiple_of": null,
+    "pad_id": 0,
+    "pad_type_id": 0,
+    "pad_token": "[PAD]"
+  },
   "added_tokens": [
     {
       "id": 0,

tokenizer_config.json CHANGED Viewed

@@ -43,12 +43,10 @@
   },
   "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
-  "do_basic_tokenize": true,
   "do_lower_case": true,
   "mask_token": "[MASK]",
   "max_length": 65,
   "model_max_length": 512,
-  "never_split": null,
   "pad_token": "[PAD]",
   "padding": "max_length",
   "sep_token": "[SEP]",

   },
   "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
   "do_lower_case": true,
   "mask_token": "[MASK]",
   "max_length": 65,
   "model_max_length": 512,
   "pad_token": "[PAD]",
   "padding": "max_length",
   "sep_token": "[SEP]",