Upload optimized ONNX models w/ GQA
#10
by
Xenova
HF Staff
- opened
- onnx/model.onnx +2 -2
- onnx/model_bnb4.onnx +3 -0
- onnx/model_fp16.onnx +2 -2
- onnx/model_int8.onnx +3 -0
- onnx/model_q4.onnx +2 -2
- onnx/model_q4f16.onnx +2 -2
- onnx/model_quantized.onnx +3 -0
- onnx/model_uint8.onnx +3 -0
onnx/model.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e790f1d6fac94097a6516ed1f07c29049097271d536d538562cd31ffc011a71
|
3 |
+
size 540345794
|
onnx/model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc32b446540fe380adb6b29c7e95b0a8402c9e6addb948307daee99735a776bb
|
3 |
+
size 175434623
|
onnx/model_fp16.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e85e706ce14a3499e1f698c0d638b430df75b5f67131d1516bd0d46b844dfb2e
|
3 |
+
size 270267067
|
onnx/model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7c33f9ef85d06734cc9d1f943f7e2ba57c77e769df727f4d3e217d9f672b0cc
|
3 |
+
size 137147867
|
onnx/model_q4.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:933577110303a2964096d19b6f15d3b4639bef7f99481ac0b61d9f3ad72f392a
|
3 |
+
size 182068553
|
onnx/model_q4f16.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9358cd4ce037c304621f8c194a525607ae7c5ea73239fcae4c21bd02f2e34ff7
|
3 |
+
size 117691126
|
onnx/model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecc1a19eece6494e2963cf74f78ace35916e8d0b803168ddd41db00979f18e39
|
3 |
+
size 137147981
|
onnx/model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecc1a19eece6494e2963cf74f78ace35916e8d0b803168ddd41db00979f18e39
|
3 |
+
size 137147981
|