GGUF
conversational
wenhuach committed on
Commit
96c8a95
·
verified ·
1 Parent(s): 192f089

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -395,7 +395,7 @@ for n, m in model.named_modules():
395
  elif isinstance(m, torch.nn.Linear) and (not "expert" in n or "shared_experts" in n) and n != "lm_head":
396
  layer_config[n] = {"bits": 4}
397
 
398
- autoround = AutoRound(model, tokenizer, iters=0, layer_config=layer_config, batch_size=8, nsamples=512)
399
  autoround.quantize_and_save("/models/DeepSeek-R1-0528-q2ks", format="gguf:q2_k_s")
400
  ```
401
 
 
395
  elif isinstance(m, torch.nn.Linear) and (not "expert" in n or "shared_experts" in n) and n != "lm_head":
396
  layer_config[n] = {"bits": 4}
397
 
398
+ autoround = AutoRound(model, tokenizer, iters=0, layer_config=layer_config, batch_size=8, nsamples=512, low_gpu_mem_usage=True)
399
  autoround.quantize_and_save("/models/DeepSeek-R1-0528-q2ks", format="gguf:q2_k_s")
400
  ```
401