Commit
·
4569506
1
Parent(s):
55593bd
Trained with Unsloth
Browse files
Upload model trained with Unsloth 2x faster
- tokenizer.json +5 -0
tokenizer.json
CHANGED
@@ -34,6 +34,10 @@
|
|
34 |
"normalizer": {
|
35 |
"type": "Sequence",
|
36 |
"normalizers": [
|
|
|
|
|
|
|
|
|
37 |
{
|
38 |
"type": "Replace",
|
39 |
"pattern": {
|
@@ -130,6 +134,7 @@
|
|
130 |
"end_of_word_suffix": null,
|
131 |
"fuse_unk": true,
|
132 |
"byte_fallback": true,
|
|
|
133 |
"vocab": {
|
134 |
"<unk>": 0,
|
135 |
"<s>": 1,
|
|
|
34 |
"normalizer": {
|
35 |
"type": "Sequence",
|
36 |
"normalizers": [
|
37 |
+
{
|
38 |
+
"type": "Prepend",
|
39 |
+
"prepend": "▁"
|
40 |
+
},
|
41 |
{
|
42 |
"type": "Replace",
|
43 |
"pattern": {
|
|
|
134 |
"end_of_word_suffix": null,
|
135 |
"fuse_unk": true,
|
136 |
"byte_fallback": true,
|
137 |
+
"ignore_merges": false,
|
138 |
"vocab": {
|
139 |
"<unk>": 0,
|
140 |
"<s>": 1,
|