OPEA
/

DeepSeek-R1-int4-sym-gguf-q4-0-inc

Model card · Files and versions

cicdatopea committed on Feb 12

Commit

ebdfdbf

·

verified ·

1 Parent(s): fcdbc83

Update README.md

Files changed (1) hide show

README.md +2 -2

README.md CHANGED Viewed

@@ -96,7 +96,7 @@ for n, m in block.named_modules():
   if isinstance(m, (torch.nn.Linear, transformers.modeling_utils.Conv1D)):
     if "experts" in n and ("shared_experts" not in n) and int(n.split('.')[-2])<63 :
       device ="cuda:1"
-    elif "experts" in n and ("shared_experts" not in n) and int(n.split('.')[-2]) >= 63 and  int(n.split('.')[-2]) < 128
       device = "cuda:2"
     elif "experts" in n and ("shared_experts" not in n) and int(n.split('.')[-2]) >= 128 and int(
           n.split('.')[-2]) < 192:
@@ -114,7 +114,7 @@ from auto_round import AutoRound
 autoround = AutoRound(model=model, tokenizer=tokenizer, device_map=device_map,
                        iters=200, batch_size=8, seqlen=512, enable_torch_compile=False)
 autoround.quantize()
-autoround.save_quantized(format="gguf:q4_0", output_dir="tmp_autoround"
 ```
 ## Ethical Considerations and Limitations

   if isinstance(m, (torch.nn.Linear, transformers.modeling_utils.Conv1D)):
     if "experts" in n and ("shared_experts" not in n) and int(n.split('.')[-2])<63 :
       device ="cuda:1"
+    elif "experts" in n and ("shared_experts" not in n) and int(n.split('.')[-2]) >= 63 and  int(n.split('.')[-2]) < 128:
       device = "cuda:2"
     elif "experts" in n and ("shared_experts" not in n) and int(n.split('.')[-2]) >= 128 and int(
           n.split('.')[-2]) < 192:
 autoround = AutoRound(model=model, tokenizer=tokenizer, device_map=device_map,
                        iters=200, batch_size=8, seqlen=512, enable_torch_compile=False)
 autoround.quantize()
+autoround.save_quantized(format="gguf:q4_0", output_dir="tmp_autoround")
 ```
 ## Ethical Considerations and Limitations