diff --git a/quantize_awq.py b/quantize_awq.py index c065160..c193afc 100644 --- a/quantize_awq.py +++ b/quantize_awq.py @@ -46,10 +46,9 @@ rounder = AutoRound( dataset=calib, bits=4, group_size=128, - seqlen=2048, + seqlen=512, nsamples=min(128, len(calib)), iters=200, - format="auto_round", ) print("Running AutoRound INT4 quantization...")