add full f16 gguf and quantized versions
Browse files
Adds the full `f16`-precision model converted to `.gguf`, along with two quantized versions (`Q1_3` and `Q2_2`).
- .gitattributes +3 -0
- model_f16.gguf +3 -0
- model_quant_Q1_3.gguf +3 -0
- model_quant_Q2_2.gguf +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
model_f16.gguf filter=lfs diff=lfs merge=lfs -text
|
37 |
+
model_quant_Q1_3.gguf filter=lfs diff=lfs merge=lfs -text
|
38 |
+
model_quant_Q2_2.gguf filter=lfs diff=lfs merge=lfs -text
|
model_f16.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7fc35e25de3315d5c5f7e2f8e4d09af4cfd84c66b12a9927c64d9640195d935c
|
3 |
+
size 6650487168
|
model_quant_Q1_3.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93397569b7562df531d823defc54749ba81046568f3ff29c3db87be41f9c81b4
|
3 |
+
size 765841184
|
model_quant_Q2_2.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0b04449fabec0ef2ce39fb311c4e203e50f06a2e81f3d6764f7c5869fb24a38
|
3 |
+
size 916849184
|