fix: patch is_mllm_model for Qwen3.6 text-only model
AutoRound misidentifies Qwen3_5ForConditionalGeneration as a vision-language model (VLM) and tries to load a vision processor. Patch is_mllm_model to always return False, which forces the text-only LLM path.
This commit is contained in:
@@ -9,6 +9,12 @@ Uses domain calibration data from substrate_v5.jsonl.
|
|||||||
import json
|
import json
|
||||||
import torch
|
import torch
|
||||||
from transformers import AutoModelForCausalLM, AutoTokenizer
|
from transformers import AutoModelForCausalLM, AutoTokenizer
|
||||||
|
|
||||||
|
# Qwen3.6-27B uses Qwen3_5ForConditionalGeneration which AutoRound
|
||||||
|
# misidentifies as a multimodal model. Patch is_mllm_model before importing AutoRound.
|
||||||
|
import auto_round.autoround as _ar
|
||||||
|
_ar.is_mllm_model = lambda *a, **kw: False
|
||||||
|
|
||||||
from auto_round import AutoRound
|
from auto_round import AutoRound
|
||||||
|
|
||||||
MODEL = "/workspace/substrate-qwen36-27b-merged"
|
MODEL = "/workspace/substrate-qwen36-27b-merged"
|
||||||
|
|||||||
Reference in New Issue
Block a user