Upload folder using huggingface_hub
Browse files- .gitattributes +1 -0
- chat_template.jinja +1 -0
- model-00001-of-000017.safetensors +3 -0
- model-00002-of-000017.safetensors +3 -0
- model-00003-of-000017.safetensors +3 -0
- model-00004-of-000017.safetensors +3 -0
- model-00005-of-000017.safetensors +3 -0
- model-00006-of-000017.safetensors +3 -0
- model-00007-of-000017.safetensors +3 -0
- model-00008-of-000017.safetensors +3 -0
- model-00009-of-000017.safetensors +3 -0
- model-00010-of-000017.safetensors +3 -0
- model-00011-of-000017.safetensors +3 -0
- model-00012-of-000017.safetensors +3 -0
- model-00013-of-000017.safetensors +3 -0
- model-00014-of-000017.safetensors +3 -0
- model-00015-of-000017.safetensors +3 -0
- model-00016-of-000017.safetensors +3 -0
- model-00017-of-000017.safetensors +3 -0
- model.safetensors.index.json +0 -0
- tokenizer_config.json +11 -11
.gitattributes
CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
figures/benchmark.jpg filter=lfs diff=lfs merge=lfs -text
|
|
|
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
figures/benchmark.jpg filter=lfs diff=lfs merge=lfs -text
|
37 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
chat_template.jinja
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='') %}{%- for message in messages %}{%- if message['role'] == 'system' %}{% set ns.system_prompt = message['content'] %}{%- endif %}{%- endfor %}{{bos_token}}{{ns.system_prompt}}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{{'<|User|>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is none %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls']%}{%- if not ns.is_first %}{{'<|Assistant|><|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\n' + '```json' + '\n' + tool['function']['arguments'] + '\n' + '```' + '<|tool▁call▁end|>'}}{%- set ns.is_first = true -%}{%- else %}{{'\n' + '<|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\n' + '```json' + '\n' + tool['function']['arguments'] + '\n' + '```' + '<|tool▁call▁end|>'}}{{'<|tool▁calls▁end|><|end▁of▁sentence|>'}}{%- endif %}{%- endfor %}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is not none %}{%- if ns.is_tool %}{{'<|tool▁outputs▁end|>' + message['content'] + '<|end▁of▁sentence|>'}}{%- set ns.is_tool = false -%}{%- else %}{% set content = message['content'] %}{% if '</think>' in content %}{% set content = content.split('</think>')[-1] %}{% endif %}{{'<|Assistant|>' + content + '<|end▁of▁sentence|>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_tool = true -%}{%- if ns.is_output_first %}{{'<|tool▁outputs▁begin|><|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- set ns.is_output_first = false %}{%- else %}{{'\n<|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- endif %}{%- endif %}{%- endfor -%}{% if ns.is_tool %}{{'<|tool▁outputs▁end|>'}}{% endif %}{% if add_generation_prompt and not ns.is_tool %}{{'<|Assistant|><think>\n'}}{% endif %}
|
model-00001-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f57a2538539d61f9f22785d3c48f089227829948ee66572808dd13d5b08d63e
|
3 |
+
size 8946552810
|
model-00002-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f948c2df3e4f3e678e1b4c75b345ce646c4843a23e7c9089462cf3995d2af45
|
3 |
+
size 8690800055
|
model-00003-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa4b0afa70d26873dabc927e59b7dbc24a0e8eda323d4fdba17927d316d3516c
|
3 |
+
size 1577092016
|
model-00004-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:077f51bc9eb56b50868cb95c7cf0d6d0f0a524b824ba3af8b248c78a46593e97
|
3 |
+
size 8690767122
|
model-00005-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e826381017b2d8a9d8704be34ee0e0ceeb0a3a9abca27beaa4555d370d5a4f10
|
3 |
+
size 8422331428
|
model-00006-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1d4326d0d4187830fcea956d8ccfafbf6871fa7baed1b759c1ed843cafe92c0
|
3 |
+
size 8690767122
|
model-00007-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62a83ba7af95d532065e46322ae2c17ee020c3c8e92b7285420c09ca0d6f68f0
|
3 |
+
size 8422331428
|
model-00008-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8189753d14d5f9b3c31466d1f5a185bb7ffc7fc346cbc06a5453e48e07c2b97b
|
3 |
+
size 8690767122
|
model-00009-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:928bea3ae97c3962b3eb3f51a66f674be4cd5858caae541becd3e175f3305403
|
3 |
+
size 8422331428
|
model-00010-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1db6d4f8387897b0f40e505310a1542f6d0308370526fa86c42cdc99451d2200
|
3 |
+
size 8690767122
|
model-00011-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31a5eb90d0773f1514ae7b240ed62961412e48f9eb160fdac6226221b87fe61f
|
3 |
+
size 8422331428
|
model-00012-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d01c2823a0393ded7f97556995b69965dad78665664853f1c8a2be901e643a44
|
3 |
+
size 8690767122
|
model-00013-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c43532c1b128f0135edc587ace540dfa53759916836960db06b73ab718e5eca
|
3 |
+
size 8422331428
|
model-00014-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f2ce0194b017ae009448602d7fd4ac24d7f25059c0a87d42fc496000f7bdacc
|
3 |
+
size 8690767122
|
model-00015-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:572ed974eb237aacf3de9ddfeaa373c62d39038a96ffd7f2beec6ea8f8a7b16e
|
3 |
+
size 8422331428
|
model-00016-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5a581377b62f0a918bf515d05f2514281eec031ea2748e7ce8123b910403bba
|
3 |
+
size 8690767122
|
model-00017-of-000017.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:605b29e86ec80aaa3a38bb3aab4bc859e4df26928fe49bbca00f127f55897e8d
|
3 |
+
size 10523694303
|
model.safetensors.index.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
CHANGED
@@ -4,7 +4,7 @@
|
|
4 |
"add_prefix_space": null,
|
5 |
"added_tokens_decoder": {
|
6 |
"128000": {
|
7 |
-
"content": "
|
8 |
"lstrip": false,
|
9 |
"normalized": false,
|
10 |
"rstrip": false,
|
@@ -12,7 +12,7 @@
|
|
12 |
"special": true
|
13 |
},
|
14 |
"128001": {
|
15 |
-
"content": "
|
16 |
"lstrip": false,
|
17 |
"normalized": false,
|
18 |
"rstrip": false,
|
@@ -92,7 +92,7 @@
|
|
92 |
"special": true
|
93 |
},
|
94 |
"128011": {
|
95 |
-
"content": "
|
96 |
"lstrip": false,
|
97 |
"normalized": false,
|
98 |
"rstrip": false,
|
@@ -100,7 +100,7 @@
|
|
100 |
"special": false
|
101 |
},
|
102 |
"128012": {
|
103 |
-
"content": "
|
104 |
"lstrip": false,
|
105 |
"normalized": false,
|
106 |
"rstrip": false,
|
@@ -124,7 +124,7 @@
|
|
124 |
"special": false
|
125 |
},
|
126 |
"128015": {
|
127 |
-
"content": "
|
128 |
"lstrip": false,
|
129 |
"normalized": false,
|
130 |
"rstrip": false,
|
@@ -2052,17 +2052,17 @@
|
|
2052 |
"special": true
|
2053 |
}
|
2054 |
},
|
2055 |
-
"bos_token": "
|
2056 |
-
"chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='') %}{%- for message in messages %}{%- if message['role'] == 'system' %}{% set ns.system_prompt = message['content'] %}{%- endif %}{%- endfor %}{{bos_token}}{{ns.system_prompt}}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{{'<|User|>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is none %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls']%}{%- if not ns.is_first %}{{'<|Assistant|><|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<|tool▁call▁end|>'}}{%- set ns.is_first = true -%}{%- else %}{{'\\n' + '<|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<|tool▁call▁end|>'}}{{'<|tool▁calls▁end|><|end▁of▁sentence|>'}}{%- endif %}{%- endfor %}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is not none %}{%- if ns.is_tool %}{{'<|tool▁outputs▁end|>' + message['content'] + '<|end▁of▁sentence|>'}}{%- set ns.is_tool = false -%}{%- else %}{% set content = message['content'] %}{% if '</think>' in content %}{% set content = content.split('</think>')[-1] %}{% endif %}{{'<|Assistant|>' + content + '<|end▁of▁sentence|>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_tool = true -%}{%- if ns.is_output_first %}{{'<|tool▁outputs▁begin|><|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- set ns.is_output_first = false %}{%- else %}{{'\\n<|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- endif %}{%- endif %}{%- endfor -%}{% if ns.is_tool %}{{'<|tool▁outputs▁end|>'}}{% endif %}{% if add_generation_prompt and not ns.is_tool %}{{'<|Assistant|><think>\\n'}}{% endif %}",
|
2057 |
"clean_up_tokenization_spaces": false,
|
2058 |
-
"eos_token": "
|
2059 |
"extra_special_tokens": {},
|
2060 |
"legacy": true,
|
2061 |
-
"model_max_length":
|
2062 |
"pad_token": "<|finetune_right_pad_id|>",
|
2063 |
"padding_side": "left",
|
2064 |
"sp_model_kwargs": {},
|
2065 |
"tokenizer_class": "LlamaTokenizerFast",
|
2066 |
"unk_token": null,
|
2067 |
-
"use_default_system_prompt": false
|
2068 |
-
}
|
|
|
|
4 |
"add_prefix_space": null,
|
5 |
"added_tokens_decoder": {
|
6 |
"128000": {
|
7 |
+
"content": "<\uff5cbegin\u2581of\u2581sentence\uff5c>",
|
8 |
"lstrip": false,
|
9 |
"normalized": false,
|
10 |
"rstrip": false,
|
|
|
12 |
"special": true
|
13 |
},
|
14 |
"128001": {
|
15 |
+
"content": "<\uff5cend\u2581of\u2581sentence\uff5c>",
|
16 |
"lstrip": false,
|
17 |
"normalized": false,
|
18 |
"rstrip": false,
|
|
|
92 |
"special": true
|
93 |
},
|
94 |
"128011": {
|
95 |
+
"content": "<\uff5cUser\uff5c>",
|
96 |
"lstrip": false,
|
97 |
"normalized": false,
|
98 |
"rstrip": false,
|
|
|
100 |
"special": false
|
101 |
},
|
102 |
"128012": {
|
103 |
+
"content": "<\uff5cAssistant\uff5c>",
|
104 |
"lstrip": false,
|
105 |
"normalized": false,
|
106 |
"rstrip": false,
|
|
|
124 |
"special": false
|
125 |
},
|
126 |
"128015": {
|
127 |
+
"content": "<\uff5c\u2581pad\u2581\uff5c>",
|
128 |
"lstrip": false,
|
129 |
"normalized": false,
|
130 |
"rstrip": false,
|
|
|
2052 |
"special": true
|
2053 |
}
|
2054 |
},
|
2055 |
+
"bos_token": "<\uff5cbegin\u2581of\u2581sentence\uff5c>",
|
|
|
2056 |
"clean_up_tokenization_spaces": false,
|
2057 |
+
"eos_token": "<\uff5cend\u2581of\u2581sentence\uff5c>",
|
2058 |
"extra_special_tokens": {},
|
2059 |
"legacy": true,
|
2060 |
+
"model_max_length": 16384,
|
2061 |
"pad_token": "<|finetune_right_pad_id|>",
|
2062 |
"padding_side": "left",
|
2063 |
"sp_model_kwargs": {},
|
2064 |
"tokenizer_class": "LlamaTokenizerFast",
|
2065 |
"unk_token": null,
|
2066 |
+
"use_default_system_prompt": false,
|
2067 |
+
"chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='') %}{%- for message in messages %}{%- if message['role'] == 'system' %}{% set ns.system_prompt = message['content'] %}{%- endif %}{%- endfor %}{{bos_token}}{{ns.system_prompt}}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{{'<\uff5cUser\uff5c>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is none %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls']%}{%- if not ns.is_first %}{{'<\uff5cAssistant\uff5c><\uff5ctool\u2581calls\u2581begin\uff5c><\uff5ctool\u2581call\u2581begin\uff5c>' + tool['type'] + '<\uff5ctool\u2581sep\uff5c>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<\uff5ctool\u2581call\u2581end\uff5c>'}}{%- set ns.is_first = true -%}{%- else %}{{'\\n' + '<\uff5ctool\u2581call\u2581begin\uff5c>' + tool['type'] + '<\uff5ctool\u2581sep\uff5c>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<\uff5ctool\u2581call\u2581end\uff5c>'}}{{'<\uff5ctool\u2581calls\u2581end\uff5c><\uff5cend\u2581of\u2581sentence\uff5c>'}}{%- endif %}{%- endfor %}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is not none %}{%- if ns.is_tool %}{{'<\uff5ctool\u2581outputs\u2581end\uff5c>' + message['content'] + '<\uff5cend\u2581of\u2581sentence\uff5c>'}}{%- set ns.is_tool = false -%}{%- else %}{% set content = message['content'] %}{% if '</think>' in content %}{% set content = content.split('</think>')[-1] %}{% endif %}{{'<\uff5cAssistant\uff5c>' + content + '<\uff5cend\u2581of\u2581sentence\uff5c>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_tool = true -%}{%- if ns.is_output_first %}{{'<\uff5ctool\u2581outputs\u2581begin\uff5c><\uff5ctool\u2581output\u2581begin\uff5c>' + message['content'] + '<\uff5ctool\u2581output\u2581end\uff5c>'}}{%- set ns.is_output_first = false %}{%- else %}{{'\\n<\uff5ctool\u2581output\u2581begin\uff5c>' + message['content'] + '<\uff5ctool\u2581output\u2581end\uff5c>'}}{%- endif %}{%- endif %}{%- endfor -%}{% if ns.is_tool %}{{'<\uff5ctool\u2581outputs\u2581end\uff5c>'}}{% endif %}{% if add_generation_prompt and not ns.is_tool %}{{'<\uff5cAssistant\uff5c><think>\\n'}}{% endif %}"
|
2068 |
+
}
|