Upload folder using huggingface_hub
Browse files
README.md
CHANGED
@@ -106,6 +106,7 @@ with torch.no_grad():
|
|
106 |
model.save_pretrained(save_folder)
|
107 |
|
108 |
# mxfp4
|
|
|
109 |
# model = AutoModelForCausalLM.from_pretrained(save_folder, trust_remote_code=True, torch_dtype=torch.bfloat16, quantization_config=quantization_config)
|
110 |
# model.save_pretrained(save_folder, safe_serialization=True)
|
111 |
```
|
|
|
106 |
model.save_pretrained(save_folder)
|
107 |
|
108 |
# mxfp4
|
109 |
+ from transformers.quantizers.quantizer_mxfp4 import Mxfp4HfQuantizer
|
110 |
# model = AutoModelForCausalLM.from_pretrained(save_folder, trust_remote_code=True, torch_dtype=torch.bfloat16, quantization_config=quantization_config)
|
111 |
# model.save_pretrained(save_folder, safe_serialization=True)
|
112 |
```
|