InternLM · lingyezhixing · Apr 6, 2026 · Copilot · Apr 8, 2026
diff --git a/lmdeploy/turbomind/deploy/parameter.py b/lmdeploy/turbomind/deploy/parameter.py
@@ -97,7 +97,10 @@ def __call__(self, f, g, i):
         scales = self._get(g, 'scales')
         f(i, scales, 'scales', to_half, apply_gs=['w2'])
         if self.compressed_tensors and not self.has_zero_point:
-            zeros = generate_zero_point(scales)
+            if scales is not None and all(s is not None for s in scales):
+                zeros = generate_zero_point(scales)
+            else:
+                zeros = scales
         else:
             zeros = self._get(g, 'qzeros')
         f(i, zeros, 'zeros', to_half, apply_gs=['w2'])