Skip to content
This repository was archived by the owner on Oct 25, 2024. It is now read-only.

Commit dbd809b

Browse files
authored
Adapt INCWeightOnlyLinear (#1686)
Signed-off-by: Kaihui-intel <[email protected]>
1 parent 03875a1 commit dbd809b

File tree

3 files changed: +3 -2 lines changed

3 files changed: +3 -2 lines changed

Diff for: intel_extension_for_transformers/transformers/llm/quantization/utils.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -23,7 +23,7 @@
 from ....tools.utils import _ipex_version
 from accelerate import init_empty_weights
 from datasets import load_dataset
-from neural_compressor.torch.algorithms.weight_only.modules import WeightOnlyLinear
+from neural_compressor.torch.algorithms.weight_only.modules import INCWeightOnlyLinear as WeightOnlyLinear
 from neural_compressor.torch.quantization import (
     AutoRoundConfig,
     AWQConfig,

Diff for: intel_extension_for_transformers/transformers/modeling/modeling_auto.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -70,7 +70,7 @@
 from ...tools.utils import is_intel_gpu_available, is_ipex_available, _neural_compressor_version
 from accelerate import init_empty_weights
 from huggingface_hub import hf_hub_download
-from neural_compressor.torch.algorithms.weight_only.modules import WeightOnlyLinear
+from neural_compressor.torch.algorithms.weight_only.modules import INCWeightOnlyLinear as WeightOnlyLinear
 from neural_compressor.model.torch_model import PyTorchFXModel
 from packaging import version
 from threading import Thread

Diff for: tests/requirements.txt

+1
Original file line number | Diff line number | Diff line change
@@ -15,6 +15,7 @@ intel-tensorflow==2.14.0
 lm-eval==0.4.3
 mlflow
 nlpaug==1.1.9
+nltk==3.8.1
 onnx
 onnxruntime
 peft==0.6.2

0 commit comments

Comments
 (0)