From 7cd9b09818197fc680ffc314c1e174b3bc01978c Mon Sep 17 00:00:00 2001 From: gushiqiao <77222802+gushiqiao@users.noreply.github.com> Date: Fri, 22 Nov 2024 11:35:00 +0800 Subject: [PATCH] Fix sglang bugs (#220) Co-authored-by: gushiqiao --- llmc/compression/quantization/module_utils.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/llmc/compression/quantization/module_utils.py b/llmc/compression/quantization/module_utils.py index a0cb5edf..50508a0a 100644 --- a/llmc/compression/quantization/module_utils.py +++ b/llmc/compression/quantization/module_utils.py @@ -1205,8 +1205,8 @@ def __repr__(self): class SglRealQuantLinear(VllmRealQuantLinear): - def __init__(self, weight, bias, scales, need_pack): - super().__init__(weight, bias, scales, need_pack) + def __init__(self, weight, bias, scales, input_scale, need_pack): + super().__init__(weight, bias, scales, input_scale, need_pack) def __repr__(self): return (