Upload 5 files
Browse files
- .gitattributes +1 -0
- config.json +5 -2
- generation_config.json +8 -0
- special_tokens_map.json +6 -0
- tokenizer.json +0 -0
- tokenizer_config.json +7 -8
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
config.json
CHANGED
@@ -4,7 +4,7 @@
|
|
4 |
],
|
5 |
"attention_dropout": 0.0,
|
6 |
"bos_token_id": 1,
|
7 |
-
"eos_token_id":
|
8 |
"head_dim": 128,
|
9 |
"hidden_act": "silu",
|
10 |
"hidden_size": 5120,
|
@@ -15,12 +15,15 @@
|
|
15 |
"num_attention_heads": 32,
|
16 |
"num_hidden_layers": 50,
|
17 |
"num_key_value_heads": 8,
|
|
|
18 |
"rms_norm_eps": 1e-05,
|
|
|
19 |
"rope_theta": 1000000.0,
|
20 |
"sliding_window": null,
|
21 |
"tie_word_embeddings": false,
|
22 |
"torch_dtype": "bfloat16",
|
23 |
-
"transformers_version": "4.51.
|
|
|
24 |
"use_cache": true,
|
25 |
"vocab_size": 131072
|
26 |
}
|
|
|
4 |
],
|
5 |
"attention_dropout": 0.0,
|
6 |
"bos_token_id": 1,
|
7 |
+
"eos_token_id": 2,
|
8 |
"head_dim": 128,
|
9 |
"hidden_act": "silu",
|
10 |
"hidden_size": 5120,
|
|
|
15 |
"num_attention_heads": 32,
|
16 |
"num_hidden_layers": 50,
|
17 |
"num_key_value_heads": 8,
|
18 |
+
"pad_token_id": 10,
|
19 |
"rms_norm_eps": 1e-05,
|
20 |
+
"rope_scaling": null,
|
21 |
"rope_theta": 1000000.0,
|
22 |
"sliding_window": null,
|
23 |
"tie_word_embeddings": false,
|
24 |
"torch_dtype": "bfloat16",
|
25 |
+
"transformers_version": "4.51.3",
|
26 |
+
"unsloth_version": "2025.4.7",
|
27 |
"use_cache": true,
|
28 |
"vocab_size": 131072
|
29 |
}
|
generation_config.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"max_length": 65536,
|
6 |
+
"pad_token_id": 10,
|
7 |
+
"transformers_version": "4.51.3"
|
8 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": "<s>",
|
3 |
+
"eos_token": "<|im_end|>",
|
4 |
+
"pad_token": "<pad>",
|
5 |
+
"unk_token": "<unk>"
|
6 |
+
}
|
tokenizer.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
CHANGED
@@ -1,7 +1,4 @@
|
|
1 |
{
|
2 |
-
"add_bos_token": true,
|
3 |
-
"add_eos_token": false,
|
4 |
-
"add_prefix_space": false,
|
5 |
"added_tokens_decoder": {
|
6 |
"0": {
|
7 |
"content": "<unk>",
|
@@ -20,7 +17,7 @@
|
|
20 |
"special": true
|
21 |
},
|
22 |
"2": {
|
23 |
-
"content": "
|
24 |
"lstrip": false,
|
25 |
"normalized": false,
|
26 |
"rstrip": false,
|
@@ -116,7 +113,7 @@
|
|
116 |
"special": true
|
117 |
},
|
118 |
"14": {
|
119 |
-
"content": "
|
120 |
"lstrip": false,
|
121 |
"normalized": false,
|
122 |
"rstrip": false,
|
@@ -124,7 +121,7 @@
|
|
124 |
"special": true
|
125 |
},
|
126 |
"15": {
|
127 |
-
"content": "
|
128 |
"lstrip": false,
|
129 |
"normalized": false,
|
130 |
"rstrip": false,
|
@@ -8005,10 +8002,12 @@
|
|
8005 |
}
|
8006 |
},
|
8007 |
"bos_token": "<s>",
|
|
|
8008 |
"clean_up_tokenization_spaces": false,
|
8009 |
"eos_token": "<|im_end|>",
|
|
|
8010 |
"model_max_length": 1000000000000000019884624838656,
|
8011 |
-
"
|
8012 |
-
"
|
8013 |
"unk_token": "<unk>"
|
8014 |
}
|
|
|
1 |
{
|
|
|
|
|
|
|
2 |
"added_tokens_decoder": {
|
3 |
"0": {
|
4 |
"content": "<unk>",
|
|
|
17 |
"special": true
|
18 |
},
|
19 |
"2": {
|
20 |
+
"content": "<|im_end|>",
|
21 |
"lstrip": false,
|
22 |
"normalized": false,
|
23 |
"rstrip": false,
|
|
|
113 |
"special": true
|
114 |
},
|
115 |
"14": {
|
116 |
+
"content": "<SPECIAL_14>",
|
117 |
"lstrip": false,
|
118 |
"normalized": false,
|
119 |
"rstrip": false,
|
|
|
121 |
"special": true
|
122 |
},
|
123 |
"15": {
|
124 |
+
"content": "<SPECIAL_15>",
|
125 |
"lstrip": false,
|
126 |
"normalized": false,
|
127 |
"rstrip": false,
|
|
|
8002 |
}
|
8003 |
},
|
8004 |
"bos_token": "<s>",
|
8005 |
+
"chat_template": "{% if 'role' in messages[0] %}{% for message in messages %}{% if message['role'] == 'user' %}{{'<|im_start|>user\n' + message['content'] + '<|im_end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|im_start|>assistant\n' + message['content'] + '<|im_end|>\n' }}{% else %}{{ '<|im_start|>system\n' + message['content'] + '<|im_end|>\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}{% else %}{% for message in messages %}{% if message['from'] == 'human' %}{{'<|im_start|>user\n' + message['value'] + '<|im_end|>\n'}}{% elif message['from'] == 'gpt' %}{{'<|im_start|>assistant\n' + message['value'] + '<|im_end|>\n' }}{% else %}{{ '<|im_start|>system\n' + message['value'] + '<|im_end|>\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}{% endif %}",
|
8006 |
"clean_up_tokenization_spaces": false,
|
8007 |
"eos_token": "<|im_end|>",
|
8008 |
+
"extra_special_tokens": {},
|
8009 |
"model_max_length": 1000000000000000019884624838656,
|
8010 |
+
"pad_token": "<pad>",
|
8011 |
+
"tokenizer_class": "PreTrainedTokenizer",
|
8012 |
"unk_token": "<unk>"
|
8013 |
}
|