Commit
·
bbaf757
1
Parent(s):
10ec43e
Fix quantized weights
Browse files
config.json
CHANGED
@@ -28,8 +28,7 @@
|
|
28 |
"bits": 4,
|
29 |
"group_size": 128,
|
30 |
"modules_to_not_convert": [
|
31 |
-
"lm_head"
|
32 |
-
"gate"
|
33 |
],
|
34 |
"quant_method": "awq",
|
35 |
"version": "gemm",
|
@@ -44,7 +43,7 @@
|
|
44 |
},
|
45 |
"rope_theta": 1000000.0,
|
46 |
"tie_word_embeddings": false,
|
47 |
-
"torch_dtype": "
|
48 |
"transformers_version": "4.43.1",
|
49 |
"use_cache": false,
|
50 |
"vocab_size": 102400
|
|
|
28 |
"bits": 4,
|
29 |
"group_size": 128,
|
30 |
"modules_to_not_convert": [
|
31 |
+
"lm_head"
|
|
|
32 |
],
|
33 |
"quant_method": "awq",
|
34 |
"version": "gemm",
|
|
|
43 |
},
|
44 |
"rope_theta": 1000000.0,
|
45 |
"tie_word_embeddings": false,
|
46 |
+
"torch_dtype": "float16",
|
47 |
"transformers_version": "4.43.1",
|
48 |
"use_cache": false,
|
49 |
"vocab_size": 102400
|
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2e439ec16548f043be8f92ff8a959a41b7982f5131e37a4a56bdb311e0a802d
|
3 |
+
size 4996470888
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a9b242bdeb878fa05571ccea91a068ff34b03595303a0a3d9d9712c6df4696d
|
3 |
+
size 4953084576
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:072155109bdd3ee825718e328aa0aec6cfc1beed0e1399ad1182f6f929b8d2b2
|
3 |
+
size 4953084584
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9072b470507f5ddf9ac9ad0cba3747bf3796e4f979cfc444804051624e67a146
|
3 |
+
size 3277554600
|
model.safetensors.index.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|