1+ from __future__ import annotations
2+
3+ from typing import TYPE_CHECKING
4+
15import torch
2- from transformers import Qwen3VLMoeConfig , Qwen3VLMoeTextConfig
3- from transformers .models .qwen3_vl_moe .modeling_qwen3_vl_moe import (
4- Qwen3VLMoeTextSparseMoeBlock as OriginalQwen3VLMoeTextSparseMoeBlock ,
5- )
66
77from llmcompressor .modeling .moe_context import MoECalibrationModule
88from llmcompressor .utils .dev import skip_weights_initialize
99
10+ if TYPE_CHECKING :
11+ from transformers import Qwen3VLMoeConfig , Qwen3VLMoeTextConfig
12+ from transformers .models .qwen3_vl_moe .modeling_qwen3_vl_moe import (
13+ Qwen3VLMoeTextSparseMoeBlock ,
14+ )
15+
1016
1117@MoECalibrationModule .register ("Qwen3VLMoeTextSparseMoeBlock" )
1218class CalibrateQwen3VLMoeTextSparseMoeBlock (MoECalibrationModule ):
@@ -19,7 +25,7 @@ class CalibrateQwen3VLMoeTextSparseMoeBlock(MoECalibrationModule):
1925
2026 def __init__ (
2127 self ,
22- original : OriginalQwen3VLMoeTextSparseMoeBlock ,
28+ original : Qwen3VLMoeTextSparseMoeBlock ,
2329 config : Qwen3VLMoeConfig ,
2430 calibrate_all_experts : bool ,
2531 ):
@@ -116,7 +122,7 @@ def __init__(self, config, original):
116122
117123def replace (
118124 config : Qwen3VLMoeConfig ,
119- original : OriginalQwen3VLMoeTextSparseMoeBlock ,
125+ original : Qwen3VLMoeTextSparseMoeBlock ,
120126 calibrate_all_experts : bool ,
121127):
122128 return CalibrateQwen3VLMoeTextSparseMoeBlock (
0 commit comments