Update README.md
Browse files
README.md
CHANGED
```diff
@@ -74,7 +74,7 @@ for n, m in model.named_modules():
     elif isinstance(m, torch.nn.Linear) and (not "expert" in n or "shared_experts" in n) and n != "lm_head":
         layer_config[n] = {"bits": 4}
 
-autoround = AutoRound(model, tokenizer, iters=0, layer_config=layer_config, nsamples=
+autoround = AutoRound(model, tokenizer, iters=0, layer_config=layer_config, nsamples=4096, dataset="NeelNanda/pile-10k,HuggingFaceH4/ultrachat_200k", seqlen=1024)
 autoround.quantize_and_save("tmp_autoround", format="gguf:q2_k_s")
 
 
```