Skip to content

Commit a7f9285

Browse files
committed
rename kernel files
1 parent f45b57c commit a7f9285

File tree

14 files changed, with 24 additions and 24 deletions.

gptqmodel/looper/awq_processor.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -20,10 +20,10 @@
2020
from ..models._const import SUPPORTS_MODULE_TYPES
2121
from ..models.writer import (PROCESS_LOG_LAYER, PROCESS_LOG_MODULE, PROCESS_LOG_NAME,
2222
PROCESS_LOG_TIME, PROCESS_USED_MEMORY, QUANT_LOG_LOSS, QUANT_LOG_NSAMPLES)
23-
from ..nn_modules.qlinear.awq_gemm import AwqGEMMQuantLinear
24-
from ..nn_modules.qlinear.awq_gemv import AwqGEMVQuantLinear
25-
from ..nn_modules.qlinear.awq_gemv_fast import AwqGEMVFastQuantLinear
26-
from ..nn_modules.qlinear.awq_marlin import AwqMarlinQuantLinear
23+
from ..nn_modules.qlinear.gemm_awq import AwqGEMMQuantLinear
24+
from ..nn_modules.qlinear.gemv_awq import AwqGEMVQuantLinear
25+
from ..nn_modules.qlinear.gemv_fast_awq import AwqGEMVFastQuantLinear
26+
from ..nn_modules.qlinear.marlin_awq import AwqMarlinQuantLinear
2727
from ..quantization.awq.modules.linear import WQLinear_GEMM, WQLinear_GEMV, WQLinear_GEMVFast, WQLinear_Marlin
2828
from ..quantization.awq.quantize.scale import apply_clip, apply_scale
2929
from ..quantization.awq.utils.module import append_str_prefix, get_op_name, get_op_by_name, set_op_by_name

gptqmodel/utils/importer.py

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -13,14 +13,14 @@
1313

1414
from ..models._const import DEVICE, normalize_device
1515
from ..nn_modules.qlinear import BaseQuantLinear, PackableQuantLinear
16-
from ..nn_modules.qlinear.awq_exllama import AwqExllamaQuantLinear
17-
from ..nn_modules.qlinear.awq_exllamav2 import AwqExllamaV2QuantLinear
18-
from ..nn_modules.qlinear.awq_gemm import AwqGEMMQuantLinear
19-
from ..nn_modules.qlinear.awq_gemv import AwqGEMVQuantLinear
20-
from ..nn_modules.qlinear.awq_gemv_fast import AwqGEMVFastQuantLinear
21-
from ..nn_modules.qlinear.awq_machete import AwqMacheteQuantLinear
22-
from ..nn_modules.qlinear.awq_marlin import AwqMarlinQuantLinear
23-
from ..nn_modules.qlinear.awq_torch import AwqTorchQuantLinear
16+
from ..nn_modules.qlinear.exllama_awq import AwqExllamaQuantLinear
17+
from ..nn_modules.qlinear.exllamav2_awq import AwqExllamaV2QuantLinear
18+
from ..nn_modules.qlinear.gemm_awq import AwqGEMMQuantLinear
19+
from ..nn_modules.qlinear.gemv_awq import AwqGEMVQuantLinear
20+
from ..nn_modules.qlinear.gemv_fast_awq import AwqGEMVFastQuantLinear
21+
from ..nn_modules.qlinear.machete_awq import AwqMacheteQuantLinear
22+
from ..nn_modules.qlinear.marlin_awq import AwqMarlinQuantLinear
23+
from ..nn_modules.qlinear.torch_awq import AwqTorchQuantLinear
2424
from ..nn_modules.qlinear.bitblas import BitBLASQuantLinear
2525
from ..nn_modules.qlinear.exllama import ExllamaQuantLinear
2626
from ..nn_modules.qlinear.exllama_eora import ExllamaEoraQuantLinear

gptqmodel/utils/model.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -46,7 +46,7 @@
4646
SUPPORTS_MODULE_TYPES,
4747
)
4848
from ..nn_modules.qlinear import BaseQuantLinear
49-
from ..nn_modules.qlinear.awq_exllamav2 import AwqExllamaV2QuantLinear
49+
from ..nn_modules.qlinear.exllamav2_awq import AwqExllamaV2QuantLinear
5050
from ..nn_modules.qlinear.exllama import ExllamaQuantLinear
5151
from ..nn_modules.qlinear.exllamav2 import ExllamaV2QuantLinear
5252
from ..quantization import FORMAT, QuantizeConfig

tests/test_awq.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -15,11 +15,11 @@
1515
from parameterized import parameterized
1616
from transformers import AutoTokenizer
1717

18-
from gptqmodel.nn_modules.qlinear.awq_gemm import AwqGEMMQuantLinear
19-
from gptqmodel.nn_modules.qlinear.awq_gemv import AwqGEMVQuantLinear
20-
from gptqmodel.nn_modules.qlinear.awq_gemv_fast import AwqGEMVFastQuantLinear
21-
from gptqmodel.nn_modules.qlinear.awq_machete import AwqMacheteQuantLinear
22-
from gptqmodel.nn_modules.qlinear.awq_marlin import AwqMarlinQuantLinear
18+
from gptqmodel.nn_modules.qlinear.gemm_awq import AwqGEMMQuantLinear
19+
from gptqmodel.nn_modules.qlinear.gemv_awq import AwqGEMVQuantLinear
20+
from gptqmodel.nn_modules.qlinear.gemv_fast_awq import AwqGEMVFastQuantLinear
21+
from gptqmodel.nn_modules.qlinear.machete_awq import AwqMacheteQuantLinear
22+
from gptqmodel.nn_modules.qlinear.marlin_awq import AwqMarlinQuantLinear
2323
from gptqmodel.quantization import FORMAT, METHOD, QUANT_CONFIG_FILENAME
2424
from gptqmodel.utils.machete import _validate_machete_device_support, machete_import_exception
2525

0 commit comments

Comments
 (0)