From 72e691a385025950053bb1c665f6f208ec1814bd Mon Sep 17 00:00:00 2001 From: Xin He Date: Thu, 9 Apr 2026 21:31:13 +0800 Subject: [PATCH] quick fix: gptqmodel no longer has gptqmodel_marlin_kernels --- auto_round_extension/cuda/gptqmodel_marlin.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/auto_round_extension/cuda/gptqmodel_marlin.py b/auto_round_extension/cuda/gptqmodel_marlin.py index 144209b08..d96e04f62 100644 --- a/auto_round_extension/cuda/gptqmodel_marlin.py +++ b/auto_round_extension/cuda/gptqmodel_marlin.py @@ -54,7 +54,10 @@ def get_marlin_layer(): ##use an ugly wrapper to import gptqmodel on demand try: import gptqmodel_marlin_kernels # pylint: disable=E0401 except ImportError as e: - marlin_import_exception = e + try: + import gptqmodel.utils.marlin as gptqmodel_marlin_kernels # pylint: disable=E0401 + except ImportError as e: + marlin_import_exception = e from auto_round.utils import logger