Skip to content

Commit 210d5af

Browse files
committed
fix
1 parent ccc6294 commit 210d5af

File tree

3 files changed

+3
-5
lines changed

3 files changed

+3
-5
lines changed

optimum/commands/export/openvino.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,6 @@
2020
from typing import TYPE_CHECKING, Optional
2121

2222
from huggingface_hub.constants import HUGGINGFACE_HUB_CACHE
23-
from transformers.utils.quantization_config import QuantizationMethod
2423

2524
from ...exporters import TasksManager
2625
from ...intel.utils.import_utils import DIFFUSERS_IMPORT_ERROR, is_diffusers_available
@@ -289,7 +288,7 @@ def _get_default_int4_config(model_id_or_path, library_name):
289288
"all_layers": None if is_int8 else self.args.all_layers,
290289
"dataset": self.args.dataset,
291290
"num_samples": self.args.num_samples,
292-
"quant_method": QuantizationMethod.AWQ if self.args.awq else None,
291+
"quant_method": "awq" if self.args.awq else "default",
293292
"sensitivity_metric": self.args.sensitivity_metric,
294293
"scale_estimation": self.args.scale_estimation,
295294
}

optimum/intel/openvino/configuration.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -200,7 +200,7 @@ def __init__(
200200
sensitivity_metric: Optional[str] = None,
201201
ignored_scope: Optional[dict] = None,
202202
num_samples: Optional[int] = None,
203-
quant_method: Union[QuantizationMethod, OVQuantizationMethod] = OVQuantizationMethod.DEFAULT,
203+
quant_method: Union[str, QuantizationMethod, OVQuantizationMethod] = OVQuantizationMethod.DEFAULT,
204204
scale_estimation: bool = None,
205205
**kwargs,
206206
):

optimum/intel/openvino/quantization.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -38,7 +38,6 @@
3838
from transformers import AutoTokenizer, DataCollator, PreTrainedModel, default_data_collator
3939
from transformers.pytorch_utils import Conv1D
4040
from transformers.utils import is_accelerate_available
41-
from transformers.utils.quantization_config import QuantizationMethod
4241

4342
from optimum.exporters.onnx.convert import check_dummy_inputs_are_allowed
4443
from optimum.exporters.tasks import TasksManager
@@ -828,7 +827,7 @@ def _weight_only_quantization(
828827
group_size=config.group_size,
829828
all_layers=config.all_layers,
830829
sensitivity_metric=sensitivity_metric,
831-
awq=config.quant_method.lower() == "awq",
830+
awq=getattr(config.quant_method, "name", "") == "AWQ",
832831
ignored_scope=config.get_ignored_scope_instance(),
833832
dataset=dataset,
834833
subset_size=config.num_samples if config.num_samples else 128,

0 commit comments

Comments
 (0)