Commit
·
244ace8
1
Parent(s):
2f79652
Upload DeepSeek-R1-Distill ONNX models
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- LICENSE +21 -0
- README.md +0 -0
- config.json +0 -0
- deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json +3 -0
- deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx +3 -0
- deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data +3 -0
- deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json +3 -0
- deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json +3 -0
- deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json +3 -0
- deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/genai_config.json +3 -0
- deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/model.onnx +3 -0
- deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/model.onnx.data +3 -0
- deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json +3 -0
- deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/tokenizer.json +3 -0
- deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json +3 -0
- deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json +3 -0
- deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx +3 -0
- deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data +3 -0
- deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json +3 -0
- deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json +3 -0
- deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json +3 -0
- deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/genai_config.json +3 -0
- deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/model.onnx +3 -0
- deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/model.onnx.data +3 -0
- deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json +3 -0
- deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/tokenizer.json +3 -0
- deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json +3 -0
- deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json +3 -0
- deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx +3 -0
- deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data +3 -0
- deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json +3 -0
- deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json +3 -0
- deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json +3 -0
- deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/genai_config.json +3 -0
- deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/model.onnx +3 -0
- deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/model.onnx.data +3 -0
- deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json +3 -0
- deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/tokenizer.json +3 -0
- deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json +3 -0
- deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json +3 -0
- deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx +3 -0
- deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data +3 -0
- deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json +3 -0
- deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json +3 -0
- deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json +3 -0
- deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/genai_config.json +3 -0
- deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/model.onnx +3 -0
- deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/model.onnx.data +3 -0
- deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json +3 -0
- deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/tokenizer.json +3 -0
LICENSE
ADDED
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
MIT License
|
2 |
+
|
3 |
+
Copyright (c) 2023 DeepSeek
|
4 |
+
|
5 |
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
6 |
+
of this software and associated documentation files (the "Software"), to deal
|
7 |
+
in the Software without restriction, including without limitation the rights
|
8 |
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
9 |
+
copies of the Software, and to permit persons to whom the Software is
|
10 |
+
furnished to do so, subject to the following conditions:
|
11 |
+
|
12 |
+
The above copyright notice and this permission notice shall be included in all
|
13 |
+
copies or substantial portions of the Software.
|
14 |
+
|
15 |
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
16 |
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
17 |
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
18 |
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
19 |
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
20 |
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
21 |
+
SOFTWARE.
|
README.md
ADDED
File without changes
|
config.json
ADDED
File without changes
|
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:223f8c7e295b02d403dcf3d0ebd17d7b7a0aae140dd075923ec5e60bd12cdd69
|
3 |
+
size 1477
|
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44d2180d888cc778b11c2594738d8431b1c8d8418dfe4694662b8ccabd89028c
|
3 |
+
size 212761
|
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cbb55e5348955e7d7596a861e4e99f6264bbdeba38b914ec4d47eb84dfabffa
|
3 |
+
size 6859931648
|
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
|
3 |
+
size 485
|
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d91915040cfac999d8c55f4b5bc6e67367c065e3a7a4e4b9438ce1f256addd86
|
3 |
+
size 17209530
|
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1dd0191e04767e4bb08ded463e8cfc118ec5089c442a38e0c8221bff425f2e7b
|
3 |
+
size 52921
|
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fce7201d5299760db0a212953ea963f35f7d5ebf171a11d1b75efb5f080af147
|
3 |
+
size 1525
|
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e9499a79a6204f3276dea9a5d8d9a35123036af938b0117b8a1ca9f857cb13a
|
3 |
+
size 284037
|
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/model.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e8fcf924a0ae90140c0099f6c55d5aa8a8259810185afc2e2c33b0a527c488f
|
3 |
+
size 5306130432
|
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
|
3 |
+
size 485
|
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d91915040cfac999d8c55f4b5bc6e67367c065e3a7a4e4b9438ce1f256addd86
|
3 |
+
size 17209530
|
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1dd0191e04767e4bb08ded463e8cfc118ec5089c442a38e0c8221bff425f2e7b
|
3 |
+
size 52921
|
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc87bc52132e57d152c937c72394cdfb9d202ee3a9ea1a1c2769588f1e59dc5f
|
3 |
+
size 1477
|
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:905c518a61d91d39bc624d17edefcf9c4dedba0e9dae4a1949c3af8ea53fc851
|
3 |
+
size 196782
|
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31729113e4cb78c0ca74137eb5c1ff3911c24d5097c795eba4a018fe981a8a47
|
3 |
+
size 1965914112
|
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
|
3 |
+
size 485
|
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
|
3 |
+
size 11422778
|
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b869a935677e8f9dc3896cb69982de89843c1bbff27194eb83542c0e3f82babc
|
3 |
+
size 6754
|
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0b37e684b7809280ea6f94304d95e7cce3df3e93d5f148db79b897e7cc893c6
|
3 |
+
size 1525
|
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63196cbdd6340502f90a07cea6b07447208d0bfa87f29921d56eb900f01e87cf
|
3 |
+
size 281689
|
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/model.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28262bc2d208413b3dd3189df4aa238c098dcc6e0dc1de7e0c37745fd2a2f5df
|
3 |
+
size 1368849408
|
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
|
3 |
+
size 485
|
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
|
3 |
+
size 11422778
|
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b869a935677e8f9dc3896cb69982de89843c1bbff27194eb83542c0e3f82babc
|
3 |
+
size 6754
|
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94acba632247c6733b9a01c7fad5ed377a2be2435576d87c19e2e3c1d3c8f7ee
|
3 |
+
size 1477
|
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9240308a8a7893e729f904084919c18c6fbed160c26c660fc8c563b7bc97520
|
3 |
+
size 336374
|
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:590668a880e7255a6883bc0b119a95721a662c6d61639339d5169c7f7778ea15
|
3 |
+
size 11928883200
|
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
|
3 |
+
size 485
|
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
|
3 |
+
size 11422778
|
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b869a935677e8f9dc3896cb69982de89843c1bbff27194eb83542c0e3f82babc
|
3 |
+
size 6754
|
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf801e1dc0924a3d7bd47ecf41be2c35e525ffd3b474e002e51d0f9eff7b3e4e
|
3 |
+
size 1525
|
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fb7f7b9ab54f552551f273e799433217316cf6a71d1bde95a64bccb5997df8b
|
3 |
+
size 482575
|
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/model.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b95f91e948ad458bdc2a1e0697fd3e8a84c54b2f9bad0617a40094ae6972bfbf
|
3 |
+
size 9462097920
|
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
|
3 |
+
size 485
|
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
|
3 |
+
size 11422778
|
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b869a935677e8f9dc3896cb69982de89843c1bbff27194eb83542c0e3f82babc
|
3 |
+
size 6754
|
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8f5900c8ba518e7d73fddfe903cd5b1f9e7b50095d9c7f6c7d4e05045e7ed75
|
3 |
+
size 1477
|
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc13f1a64185e05e8b9b7bbc333b221720d37c948c1406e188f44980237a51b8
|
3 |
+
size 197432
|
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c77a01ab0da245da13925b0f92f5f12d76d30fe5b91cf6a2fade666172bcad73
|
3 |
+
size 6667360256
|
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
|
3 |
+
size 485
|
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
|
3 |
+
size 11422778
|
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b869a935677e8f9dc3896cb69982de89843c1bbff27194eb83542c0e3f82babc
|
3 |
+
size 6754
|
deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0966761d8b5da58788742cc4b441663ce87b21db3186865812f14ecd15cad7af
|
3 |
+
size 1525
|
deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6964501f47433e067091a911260174dedacf2dd6fd372873f428701d9d74cdb1
|
3 |
+
size 282885
|
deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/model.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:787cfa017ea3caf3e0b255eecdf0e6b0e189cec19b1452b26dc14f2551c6c55f
|
3 |
+
size 5101251584
|
deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
|
3 |
+
size 485
|
deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
|
3 |
+
size 11422778
|