Commit
·
118914d
1
Parent(s):
6c14c32
Upload Phi-4-reasoning ONNX models
Browse files- cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json +3 -0
- cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/merges.txt +0 -0
- cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx +3 -0
- cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data +3 -0
- cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json +3 -0
- cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json +3 -0
- cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json +3 -0
- cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/vocab.json +3 -0
- gpu/gpu-int4-rtn-block-32/genai_config.json +3 -0
- gpu/gpu-int4-rtn-block-32/merges.txt +0 -0
- gpu/gpu-int4-rtn-block-32/model.onnx +3 -0
- gpu/gpu-int4-rtn-block-32/model.onnx.data +3 -0
- gpu/gpu-int4-rtn-block-32/special_tokens_map.json +3 -0
- gpu/gpu-int4-rtn-block-32/tokenizer.json +3 -0
- gpu/gpu-int4-rtn-block-32/tokenizer_config.json +3 -0
- gpu/gpu-int4-rtn-block-32/vocab.json +3 -0
cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f58bf7a843c74acaa47c135d2eeaa10b8c93cd1ab6d1313bec0a8db5ee62769f
|
3 |
+
size 1475
|
cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5398bcc88f945aea1ce42648dbec37b520915d3f41d5fb199cc8002113d58a0c
|
3 |
+
size 265958
|
cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/model.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e015e1f95b2844807d38ea495778b629160c28f981ddbeae3b203d8ed0105f23
|
3 |
+
size 10914451456
|
cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1709cc2511788dd182569aa4071b845ac5df22a9424712dd7e456783be74be3
|
3 |
+
size 570
|
cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98fe258b0c1e42a10a9c3b5692ba081d40c177da924800c4f034ad940f794ff9
|
3 |
+
size 7153246
|
cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44cfcdddd4a037ef37cc426c4c26c3ed6f494f1d82dda3e1f73ff9efccfa0878
|
3 |
+
size 19176
|
cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/vocab.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23b80b3c4932a7733eb91487cb2fdbc56c5bd199a459128f538095a36dad5287
|
3 |
+
size 1612628
|
gpu/gpu-int4-rtn-block-32/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a26e6b15490393865cf5fd7632451c2dc2d4b79b14ff159f337e2296fb66a7f
|
3 |
+
size 1524
|
gpu/gpu-int4-rtn-block-32/merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
gpu/gpu-int4-rtn-block-32/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc2038958d9a92310c4fc3727bd51b760bc6aa915bd8d9c897f61070ddfdfc93
|
3 |
+
size 358825
|
gpu/gpu-int4-rtn-block-32/model.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d2e92e8d7d3cbe31e8613a1f8f884eafbae27bf3bcf2bf9646408665f21fa8b
|
3 |
+
size 8993548288
|
gpu/gpu-int4-rtn-block-32/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1709cc2511788dd182569aa4071b845ac5df22a9424712dd7e456783be74be3
|
3 |
+
size 570
|
gpu/gpu-int4-rtn-block-32/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98fe258b0c1e42a10a9c3b5692ba081d40c177da924800c4f034ad940f794ff9
|
3 |
+
size 7153246
|
gpu/gpu-int4-rtn-block-32/tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44cfcdddd4a037ef37cc426c4c26c3ed6f494f1d82dda3e1f73ff9efccfa0878
|
3 |
+
size 19176
|
gpu/gpu-int4-rtn-block-32/vocab.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23b80b3c4932a7733eb91487cb2fdbc56c5bd199a459128f538095a36dad5287
|
3 |
+
size 1612628
|