[moe][quant] add weight name case for offset (#15515)

MengqingCao · web-flow · commit fb22be5817cc · 2025-03-27T04:50:29.000Z
Signed-off-by: Mengqing Cao <cmq0113@163.com>
diff --git a/vllm/model_executor/layers/fused_moe/layer.py b/vllm/model_executor/layers/fused_moe/layer.py
@@ -699,8 +699,9 @@ def weight_loader(self, param: torch.nn.Parameter,
                              tp_rank=self.tp_rank)
             return
 
-        # Case weight scales and zero_points
-        if ("scale" in weight_name or "zero" in weight_name):
+        # Case weight scales, zero_points and offset
+        if ("scale" in weight_name or "zero" in weight_name
+                or "offset" in weight_name):
             # load the weight scales and zp based on the quantization scheme
             # supported weight scales/zp can be found in
             # FusedMoeWeightScaleSupported