diff --git a/quantize_awq.py b/quantize_awq.py
index 746c43d..c065160 100644
--- a/quantize_awq.py
+++ b/quantize_awq.py
@@ -9,6 +9,12 @@ Uses domain calibration data from substrate_v5.jsonl.
 import json
 import torch
 from transformers import AutoModelForCausalLM, AutoTokenizer
+
+# Qwen3.6-27B uses Qwen3_5ForConditionalGeneration which AutoRound
+# misidentifies as a multimodal model. Patch before importing AutoRound.
+import auto_round.autoround as _ar
+_ar.is_mllm_model = lambda *a, **kw: False
+
 from auto_round import AutoRound
 
 MODEL = "/workspace/substrate-qwen36-27b-merged"