zzzmahesh committed on
Commit
e2bec7d
·
verified ·
1 Parent(s): 938d259

Upload tokenizer

Browse files
special_tokens_map.json CHANGED
@@ -12,5 +12,12 @@
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
 
 
 
 
 
 
 
15
  }
16
  }
 
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
  }
23
  }
tokenizer.json CHANGED
@@ -1,7 +1,14 @@
1
  {
2
  "version": "1.0",
3
  "truncation": null,
4
- "padding": null,
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 128000,
@@ -2306,6 +2313,15 @@
2306
  "rstrip": false,
2307
  "normalized": false,
2308
  "special": true
 
 
 
 
 
 
 
 
 
2309
  }
2310
  ],
2311
  "normalizer": null,
 
1
  {
2
  "version": "1.0",
3
  "truncation": null,
4
+ "padding": {
5
+ "strategy": "BatchLongest",
6
+ "direction": "Right",
7
+ "pad_to_multiple_of": null,
8
+ "pad_id": 128256,
9
+ "pad_type_id": 0,
10
+ "pad_token": "[PAD]"
11
+ },
12
  "added_tokens": [
13
  {
14
  "id": 128000,
 
2313
  "rstrip": false,
2314
  "normalized": false,
2315
  "special": true
2316
+ },
2317
+ {
2318
+ "id": 128256,
2319
+ "content": "[PAD]",
2320
+ "single_word": false,
2321
+ "lstrip": false,
2322
+ "rstrip": false,
2323
+ "normalized": false,
2324
+ "special": true
2325
  }
2326
  ],
2327
  "normalizer": null,
tokenizer_config.json CHANGED
@@ -2047,6 +2047,14 @@
2047
  "rstrip": false,
2048
  "single_word": false,
2049
  "special": true
 
 
 
 
 
 
 
 
2050
  }
2051
  },
2052
  "bos_token": "<|begin_of_text|>",
@@ -2058,5 +2066,6 @@
2058
  "attention_mask"
2059
  ],
2060
  "model_max_length": 1000000000000000019884624838656,
 
2061
  "tokenizer_class": "PreTrainedTokenizerFast"
2062
  }
 
2047
  "rstrip": false,
2048
  "single_word": false,
2049
  "special": true
2050
+ },
2051
+ "128256": {
2052
+ "content": "[PAD]",
2053
+ "lstrip": false,
2054
+ "normalized": false,
2055
+ "rstrip": false,
2056
+ "single_word": false,
2057
+ "special": true
2058
  }
2059
  },
2060
  "bos_token": "<|begin_of_text|>",
 
2066
  "attention_mask"
2067
  ],
2068
  "model_max_length": 1000000000000000019884624838656,
2069
+ "pad_token": "[PAD]",
2070
  "tokenizer_class": "PreTrainedTokenizerFast"
2071
  }