diff --git a/llmc/compression/quantization/module_utils.py b/llmc/compression/quantization/module_utils.py index a0cb5edf..50508a0a 100644 --- a/llmc/compression/quantization/module_utils.py +++ b/llmc/compression/quantization/module_utils.py @@ -1205,8 +1205,8 @@ def __repr__(self): class SglRealQuantLinear(VllmRealQuantLinear): - def __init__(self, weight, bias, scales, need_pack): - super().__init__(weight, bias, scales, need_pack) + def __init__(self, weight, bias, scales, input_scale, need_pack): + super().__init__(weight, bias, scales, input_scale, need_pack) def __repr__(self): return (