Skip to content

Commit

Permalink
revert change
Browse files Browse the repository at this point in the history
  • Loading branch information
wenhuach21 committed Dec 12, 2024
1 parent 0371849 commit 2511193
Showing 1 changed file with 9 additions and 9 deletions.
18 changes: 9 additions & 9 deletions auto_round/backend.py
Original file line number Diff line number Diff line change
Expand Up @@ -132,15 +132,15 @@ def check_auto_round_exllamav2_installed():
"auto_gptq:tritonv2"],
requirements=["auto-gptq>=0.7.1", "triton<3.0,>=2.0"]
)
#
# BackendInfos['gptq:cuda'] = BackendInfo(device=["cuda"], sym=[True, False],
# packing_format="triton_zp+-1",
# bits=[2, 3, 4, 8], group_size=None,
# priority=1, feature_checks=[feature_multiply_checker_32],
# alias=["auto_round:auto_gptq:cuda,auto_gptq:cuda, auto_round:gptq:cuda"],
# convertable_format=["triton_zp+-1"],
# requirements=["auto-gptq>=0.7.1"]
# )

# Register the 'gptq:cuda' backend entry (depends on auto-gptq>=0.7.1).
#
# Each alias is its own list element. Previously all three names were packed
# into a single comma-joined string, so the list contained one entry that
# equalled none of the individual alias names.
# NOTE(review): assumes aliases are matched per list element, as the
# neighbouring entries suggest -- confirm against the alias lookup code.
BackendInfos['gptq:cuda'] = BackendInfo(
    device=["cuda"],
    sym=[True, False],
    packing_format="triton_zp+-1",
    bits=[2, 3, 4, 8],
    group_size=None,
    priority=1,
    feature_checks=[feature_multiply_checker_32],
    alias=[
        "auto_round:auto_gptq:cuda",
        "auto_gptq:cuda",
        "auto_round:gptq:cuda",
    ],
    convertable_format=["triton_zp+-1"],
    requirements=["auto-gptq>=0.7.1"],
)

BackendInfos['awq:gemm'] = BackendInfo(device=["cuda"], sym=[True, False], ## actually is gemm
packing_format="awq",
Expand Down

0 comments on commit 2511193

Please sign in to comment.