kvaishnavi committed on
Commit
244ace8
·
1 Parent(s): 2f79652

Upload DeepSeek-R1-Distill ONNX models

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. LICENSE +21 -0
  2. README.md +0 -0
  3. config.json +0 -0
  4. deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json +3 -0
  5. deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx +3 -0
  6. deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data +3 -0
  7. deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json +3 -0
  8. deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json +3 -0
  9. deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json +3 -0
  10. deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/genai_config.json +3 -0
  11. deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/model.onnx +3 -0
  12. deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/model.onnx.data +3 -0
  13. deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json +3 -0
  14. deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/tokenizer.json +3 -0
  15. deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json +3 -0
  16. deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json +3 -0
  17. deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx +3 -0
  18. deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data +3 -0
  19. deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json +3 -0
  20. deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json +3 -0
  21. deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json +3 -0
  22. deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/genai_config.json +3 -0
  23. deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/model.onnx +3 -0
  24. deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/model.onnx.data +3 -0
  25. deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json +3 -0
  26. deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/tokenizer.json +3 -0
  27. deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json +3 -0
  28. deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json +3 -0
  29. deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx +3 -0
  30. deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data +3 -0
  31. deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json +3 -0
  32. deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json +3 -0
  33. deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json +3 -0
  34. deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/genai_config.json +3 -0
  35. deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/model.onnx +3 -0
  36. deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/model.onnx.data +3 -0
  37. deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json +3 -0
  38. deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/tokenizer.json +3 -0
  39. deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json +3 -0
  40. deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json +3 -0
  41. deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx +3 -0
  42. deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data +3 -0
  43. deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json +3 -0
  44. deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json +3 -0
  45. deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json +3 -0
  46. deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/genai_config.json +3 -0
  47. deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/model.onnx +3 -0
  48. deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/model.onnx.data +3 -0
  49. deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json +3 -0
  50. deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/tokenizer.json +3 -0
LICENSE ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ MIT License
2
+
3
+ Copyright (c) 2023 DeepSeek
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
README.md ADDED
File without changes
config.json ADDED
File without changes
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:223f8c7e295b02d403dcf3d0ebd17d7b7a0aae140dd075923ec5e60bd12cdd69
3
+ size 1477
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44d2180d888cc778b11c2594738d8431b1c8d8418dfe4694662b8ccabd89028c
3
+ size 212761
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cbb55e5348955e7d7596a861e4e99f6264bbdeba38b914ec4d47eb84dfabffa
3
+ size 6859931648
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
3
+ size 485
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d91915040cfac999d8c55f4b5bc6e67367c065e3a7a4e4b9438ce1f256addd86
3
+ size 17209530
deepseek-r1-distill-llama-8B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dd0191e04767e4bb08ded463e8cfc118ec5089c442a38e0c8221bff425f2e7b
3
+ size 52921
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/genai_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fce7201d5299760db0a212953ea963f35f7d5ebf171a11d1b75efb5f080af147
3
+ size 1525
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e9499a79a6204f3276dea9a5d8d9a35123036af938b0117b8a1ca9f857cb13a
3
+ size 284037
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e8fcf924a0ae90140c0099f6c55d5aa8a8259810185afc2e2c33b0a527c488f
3
+ size 5306130432
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
3
+ size 485
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d91915040cfac999d8c55f4b5bc6e67367c065e3a7a4e4b9438ce1f256addd86
3
+ size 17209530
deepseek-r1-distill-llama-8B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dd0191e04767e4bb08ded463e8cfc118ec5089c442a38e0c8221bff425f2e7b
3
+ size 52921
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc87bc52132e57d152c937c72394cdfb9d202ee3a9ea1a1c2769588f1e59dc5f
3
+ size 1477
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:905c518a61d91d39bc624d17edefcf9c4dedba0e9dae4a1949c3af8ea53fc851
3
+ size 196782
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31729113e4cb78c0ca74137eb5c1ff3911c24d5097c795eba4a018fe981a8a47
3
+ size 1965914112
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
3
+ size 485
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
deepseek-r1-distill-qwen-1.5B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b869a935677e8f9dc3896cb69982de89843c1bbff27194eb83542c0e3f82babc
3
+ size 6754
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/genai_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0b37e684b7809280ea6f94304d95e7cce3df3e93d5f148db79b897e7cc893c6
3
+ size 1525
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63196cbdd6340502f90a07cea6b07447208d0bfa87f29921d56eb900f01e87cf
3
+ size 281689
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28262bc2d208413b3dd3189df4aa238c098dcc6e0dc1de7e0c37745fd2a2f5df
3
+ size 1368849408
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
3
+ size 485
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
deepseek-r1-distill-qwen-1.5B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b869a935677e8f9dc3896cb69982de89843c1bbff27194eb83542c0e3f82babc
3
+ size 6754
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94acba632247c6733b9a01c7fad5ed377a2be2435576d87c19e2e3c1d3c8f7ee
3
+ size 1477
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9240308a8a7893e729f904084919c18c6fbed160c26c660fc8c563b7bc97520
3
+ size 336374
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:590668a880e7255a6883bc0b119a95721a662c6d61639339d5169c7f7778ea15
3
+ size 11928883200
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
3
+ size 485
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
deepseek-r1-distill-qwen-14B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b869a935677e8f9dc3896cb69982de89843c1bbff27194eb83542c0e3f82babc
3
+ size 6754
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/genai_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf801e1dc0924a3d7bd47ecf41be2c35e525ffd3b474e002e51d0f9eff7b3e4e
3
+ size 1525
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fb7f7b9ab54f552551f273e799433217316cf6a71d1bde95a64bccb5997df8b
3
+ size 482575
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b95f91e948ad458bdc2a1e0697fd3e8a84c54b2f9bad0617a40094ae6972bfbf
3
+ size 9462097920
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
3
+ size 485
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
deepseek-r1-distill-qwen-14B/gpu/gpu-int4-rtn-block-32/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b869a935677e8f9dc3896cb69982de89843c1bbff27194eb83542c0e3f82babc
3
+ size 6754
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8f5900c8ba518e7d73fddfe903cd5b1f9e7b50095d9c7f6c7d4e05045e7ed75
3
+ size 1477
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc13f1a64185e05e8b9b7bbc333b221720d37c948c1406e188f44980237a51b8
3
+ size 197432
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c77a01ab0da245da13925b0f92f5f12d76d30fe5b91cf6a2fade666172bcad73
3
+ size 6667360256
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
3
+ size 485
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
deepseek-r1-distill-qwen-7B/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b869a935677e8f9dc3896cb69982de89843c1bbff27194eb83542c0e3f82babc
3
+ size 6754
deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/genai_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0966761d8b5da58788742cc4b441663ce87b21db3186865812f14ecd15cad7af
3
+ size 1525
deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6964501f47433e067091a911260174dedacf2dd6fd372873f428701d9d74cdb1
3
+ size 282885
deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:787cfa017ea3caf3e0b255eecdf0e6b0e189cec19b1452b26dc14f2551c6c55f
3
+ size 5101251584
deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59cda48bbe8bab9d61ffb410e6e3c07b6d98bff73cee7c88ff8b51f95f21ab1c
3
+ size 485
deepseek-r1-distill-qwen-7B/gpu/gpu-int4-rtn-block-32/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778