From 934be8ce483f7a2dc31d2f6660fc0ff3a840c615 Mon Sep 17 00:00:00 2001
From: marauder-actual
Date: Mon, 1 Jun 2026 04:16:32 +0200
Subject: [PATCH] fix: load tokenizer from base repo for quant venv compat

Merged model has tokenizer_class=TokenizersBackend (transformers 5.x)
which is unknown to transformers 4.57.6 in the quant venv.
---
 quantize_awq.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/quantize_awq.py b/quantize_awq.py
index 53c1bfe..77032d7 100644
--- a/quantize_awq.py
+++ b/quantize_awq.py
@@ -13,9 +13,13 @@ from llmcompressor import oneshot
 MODEL = "/workspace/substrate-qwen36-27b-merged"
 OUTPUT = "/workspace/substrate-qwen36-27b-awq"
 CALIB_DATA = "/workspace/substrate_v5.jsonl"
+# Merged model was saved with transformers 5.5.0 which writes
+# tokenizer_class=TokenizersBackend — unknown to 4.57.6 in the quant venv.
+# Load tokenizer from original repo (has standard class name).
+TOKENIZER_SOURCE = "Qwen/Qwen3.6-27B"
 
 print("Loading tokenizer...")
-tokenizer = AutoTokenizer.from_pretrained(MODEL)
+tokenizer = AutoTokenizer.from_pretrained(TOKENIZER_SOURCE)
 
 print("Loading model...")
 model = AutoModelForCausalLM.from_pretrained(