teknium committed on
Commit
5590cc6
·
verified ·
1 Parent(s): 20776db

Upload tokenizer.json

Browse files
Files changed (1) hide show
  1. tokenizer.json +30 -30
tokenizer.json CHANGED
@@ -104,7 +104,7 @@
104
  },
105
  {
106
  "id": 128011,
107
- "content": "<tools>",
108
  "single_word": false,
109
  "lstrip": false,
110
  "rstrip": false,
@@ -113,7 +113,7 @@
113
  },
114
  {
115
  "id": 128012,
116
- "content": "</tools>",
117
  "single_word": false,
118
  "lstrip": false,
119
  "rstrip": false,
@@ -140,7 +140,7 @@
140
  },
141
  {
142
  "id": 128015,
143
- "content": "<schema>",
144
  "single_word": false,
145
  "lstrip": false,
146
  "rstrip": false,
@@ -149,7 +149,7 @@
149
  },
150
  {
151
  "id": 128016,
152
- "content": "</schema>",
153
  "single_word": false,
154
  "lstrip": false,
155
  "rstrip": false,
@@ -158,7 +158,7 @@
158
  },
159
  {
160
  "id": 128017,
161
- "content": "<scratch_pad>",
162
  "single_word": false,
163
  "lstrip": false,
164
  "rstrip": false,
@@ -167,7 +167,7 @@
167
  },
168
  {
169
  "id": 128018,
170
- "content": "</scratch_pad>",
171
  "single_word": false,
172
  "lstrip": false,
173
  "rstrip": false,
@@ -176,7 +176,7 @@
176
  },
177
  {
178
  "id": 128019,
179
- "content": "<SCRATCHPAD>",
180
  "single_word": false,
181
  "lstrip": false,
182
  "rstrip": false,
@@ -185,7 +185,7 @@
185
  },
186
  {
187
  "id": 128020,
188
- "content": "</SCRATCHPAD>",
189
  "single_word": false,
190
  "lstrip": false,
191
  "rstrip": false,
@@ -194,7 +194,7 @@
194
  },
195
  {
196
  "id": 128021,
197
- "content": "<REASONING>",
198
  "single_word": false,
199
  "lstrip": false,
200
  "rstrip": false,
@@ -203,7 +203,7 @@
203
  },
204
  {
205
  "id": 128022,
206
- "content": "</REASONING>",
207
  "single_word": false,
208
  "lstrip": false,
209
  "rstrip": false,
@@ -212,7 +212,7 @@
212
  },
213
  {
214
  "id": 128023,
215
- "content": "<INNER_MONOLOGUE>",
216
  "single_word": false,
217
  "lstrip": false,
218
  "rstrip": false,
@@ -221,7 +221,7 @@
221
  },
222
  {
223
  "id": 128024,
224
- "content": "</INNER_MONOLOGUE>",
225
  "single_word": false,
226
  "lstrip": false,
227
  "rstrip": false,
@@ -230,7 +230,7 @@
230
  },
231
  {
232
  "id": 128025,
233
- "content": "<PLAN>",
234
  "single_word": false,
235
  "lstrip": false,
236
  "rstrip": false,
@@ -239,7 +239,7 @@
239
  },
240
  {
241
  "id": 128026,
242
- "content": "</PLAN>",
243
  "single_word": false,
244
  "lstrip": false,
245
  "rstrip": false,
@@ -248,7 +248,7 @@
248
  },
249
  {
250
  "id": 128027,
251
- "content": "<EXECUTION>",
252
  "single_word": false,
253
  "lstrip": false,
254
  "rstrip": false,
@@ -257,7 +257,7 @@
257
  },
258
  {
259
  "id": 128028,
260
- "content": "</EXECUTION>",
261
  "single_word": false,
262
  "lstrip": false,
263
  "rstrip": false,
@@ -266,7 +266,7 @@
266
  },
267
  {
268
  "id": 128029,
269
- "content": "<REFLECTION>",
270
  "single_word": false,
271
  "lstrip": false,
272
  "rstrip": false,
@@ -275,7 +275,7 @@
275
  },
276
  {
277
  "id": 128030,
278
- "content": "</REFLECTION>",
279
  "single_word": false,
280
  "lstrip": false,
281
  "rstrip": false,
@@ -284,7 +284,7 @@
284
  },
285
  {
286
  "id": 128031,
287
- "content": "<THINKING>",
288
  "single_word": false,
289
  "lstrip": false,
290
  "rstrip": false,
@@ -293,7 +293,7 @@
293
  },
294
  {
295
  "id": 128032,
296
- "content": "</THINKING>",
297
  "single_word": false,
298
  "lstrip": false,
299
  "rstrip": false,
@@ -302,7 +302,7 @@
302
  },
303
  {
304
  "id": 128033,
305
- "content": "<SOLUTION>",
306
  "single_word": false,
307
  "lstrip": false,
308
  "rstrip": false,
@@ -311,7 +311,7 @@
311
  },
312
  {
313
  "id": 128034,
314
- "content": "</SOLUTION>",
315
  "single_word": false,
316
  "lstrip": false,
317
  "rstrip": false,
@@ -320,7 +320,7 @@
320
  },
321
  {
322
  "id": 128035,
323
- "content": "<EXPLANATION>",
324
  "single_word": false,
325
  "lstrip": false,
326
  "rstrip": false,
@@ -329,7 +329,7 @@
329
  },
330
  {
331
  "id": 128036,
332
- "content": "</EXPLANATION>",
333
  "single_word": false,
334
  "lstrip": false,
335
  "rstrip": false,
@@ -338,7 +338,7 @@
338
  },
339
  {
340
  "id": 128037,
341
- "content": "<UNIT_TEST>",
342
  "single_word": false,
343
  "lstrip": false,
344
  "rstrip": false,
@@ -347,25 +347,25 @@
347
  },
348
  {
349
  "id": 128038,
350
- "content": "</UNIT_TEST>",
351
  "single_word": false,
352
  "lstrip": false,
353
  "rstrip": false,
354
  "normalized": false,
355
- "special": false
356
  },
357
  {
358
  "id": 128039,
359
- "content": "<|im_end|>",
360
  "single_word": false,
361
  "lstrip": false,
362
  "rstrip": false,
363
  "normalized": false,
364
- "special": true
365
  },
366
  {
367
  "id": 128040,
368
- "content": "<|im_start|>",
369
  "single_word": false,
370
  "lstrip": false,
371
  "rstrip": false,
 
104
  },
105
  {
106
  "id": 128011,
107
+ "content": "<think>",
108
  "single_word": false,
109
  "lstrip": false,
110
  "rstrip": false,
 
113
  },
114
  {
115
  "id": 128012,
116
+ "content": "</think>",
117
  "single_word": false,
118
  "lstrip": false,
119
  "rstrip": false,
 
140
  },
141
  {
142
  "id": 128015,
143
+ "content": "<|reserved_special_token_7|>",
144
  "single_word": false,
145
  "lstrip": false,
146
  "rstrip": false,
 
149
  },
150
  {
151
  "id": 128016,
152
+ "content": "<|reserved_special_token_8|>",
153
  "single_word": false,
154
  "lstrip": false,
155
  "rstrip": false,
 
158
  },
159
  {
160
  "id": 128017,
161
+ "content": "<|reserved_special_token_9|>",
162
  "single_word": false,
163
  "lstrip": false,
164
  "rstrip": false,
 
167
  },
168
  {
169
  "id": 128018,
170
+ "content": "<|reserved_special_token_10|>",
171
  "single_word": false,
172
  "lstrip": false,
173
  "rstrip": false,
 
176
  },
177
  {
178
  "id": 128019,
179
+ "content": "<|reserved_special_token_11|>",
180
  "single_word": false,
181
  "lstrip": false,
182
  "rstrip": false,
 
185
  },
186
  {
187
  "id": 128020,
188
+ "content": "<|reserved_special_token_12|>",
189
  "single_word": false,
190
  "lstrip": false,
191
  "rstrip": false,
 
194
  },
195
  {
196
  "id": 128021,
197
+ "content": "<|reserved_special_token_13|>",
198
  "single_word": false,
199
  "lstrip": false,
200
  "rstrip": false,
 
203
  },
204
  {
205
  "id": 128022,
206
+ "content": "<|reserved_special_token_14|>",
207
  "single_word": false,
208
  "lstrip": false,
209
  "rstrip": false,
 
212
  },
213
  {
214
  "id": 128023,
215
+ "content": "<|reserved_special_token_15|>",
216
  "single_word": false,
217
  "lstrip": false,
218
  "rstrip": false,
 
221
  },
222
  {
223
  "id": 128024,
224
+ "content": "<|reserved_special_token_16|>",
225
  "single_word": false,
226
  "lstrip": false,
227
  "rstrip": false,
 
230
  },
231
  {
232
  "id": 128025,
233
+ "content": "<|reserved_special_token_17|>",
234
  "single_word": false,
235
  "lstrip": false,
236
  "rstrip": false,
 
239
  },
240
  {
241
  "id": 128026,
242
+ "content": "<|reserved_special_token_18|>",
243
  "single_word": false,
244
  "lstrip": false,
245
  "rstrip": false,
 
248
  },
249
  {
250
  "id": 128027,
251
+ "content": "<|reserved_special_token_19|>",
252
  "single_word": false,
253
  "lstrip": false,
254
  "rstrip": false,
 
257
  },
258
  {
259
  "id": 128028,
260
+ "content": "<|reserved_special_token_20|>",
261
  "single_word": false,
262
  "lstrip": false,
263
  "rstrip": false,
 
266
  },
267
  {
268
  "id": 128029,
269
+ "content": "<|reserved_special_token_21|>",
270
  "single_word": false,
271
  "lstrip": false,
272
  "rstrip": false,
 
275
  },
276
  {
277
  "id": 128030,
278
+ "content": "<|reserved_special_token_22|>",
279
  "single_word": false,
280
  "lstrip": false,
281
  "rstrip": false,
 
284
  },
285
  {
286
  "id": 128031,
287
+ "content": "<|reserved_special_token_23|>",
288
  "single_word": false,
289
  "lstrip": false,
290
  "rstrip": false,
 
293
  },
294
  {
295
  "id": 128032,
296
+ "content": "<|reserved_special_token_24|>",
297
  "single_word": false,
298
  "lstrip": false,
299
  "rstrip": false,
 
302
  },
303
  {
304
  "id": 128033,
305
+ "content": "<|reserved_special_token_25|>",
306
  "single_word": false,
307
  "lstrip": false,
308
  "rstrip": false,
 
311
  },
312
  {
313
  "id": 128034,
314
+ "content": "<|reserved_special_token_26|>",
315
  "single_word": false,
316
  "lstrip": false,
317
  "rstrip": false,
 
320
  },
321
  {
322
  "id": 128035,
323
+ "content": "<|reserved_special_token_27|>",
324
  "single_word": false,
325
  "lstrip": false,
326
  "rstrip": false,
 
329
  },
330
  {
331
  "id": 128036,
332
+ "content": "<|reserved_special_token_28|>",
333
  "single_word": false,
334
  "lstrip": false,
335
  "rstrip": false,
 
338
  },
339
  {
340
  "id": 128037,
341
+ "content": "<|reserved_special_token_29|>",
342
  "single_word": false,
343
  "lstrip": false,
344
  "rstrip": false,
 
347
  },
348
  {
349
  "id": 128038,
350
+ "content": "<|reserved_special_token_30|>",
351
  "single_word": false,
352
  "lstrip": false,
353
  "rstrip": false,
354
  "normalized": false,
355
+ "special": true
356
  },
357
  {
358
  "id": 128039,
359
+ "content": "<|reserved_special_token_31|>",
360
  "single_word": false,
361
  "lstrip": false,
362
  "rstrip": false,
363
  "normalized": false,
364
+ "special": false
365
  },
366
  {
367
  "id": 128040,
368
+ "content": "<|reserved_special_token_32|>",
369
  "single_word": false,
370
  "lstrip": false,
371
  "rstrip": false,