From 31815357bd83c07e782868ed2582385893a0f346 Mon Sep 17 00:00:00 2001 From: eaidova Date: Wed, 4 Dec 2024 09:12:25 +0400 Subject: [PATCH 1/4] import OVQuantizer only if it is required in VLM --- optimum/intel/openvino/modeling_visual_language.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/optimum/intel/openvino/modeling_visual_language.py b/optimum/intel/openvino/modeling_visual_language.py index aa9b23a0ee..8d6edea0f0 100644 --- a/optimum/intel/openvino/modeling_visual_language.py +++ b/optimum/intel/openvino/modeling_visual_language.py @@ -26,7 +26,6 @@ from ...exporters.openvino import main_export from ...exporters.openvino.stateful import ensure_stateful_is_available, model_has_input_output_name from ...exporters.openvino.utils import save_config -from .. import OVQuantizer from .configuration import OVConfig, OVWeightQuantizationConfig from .modeling_base import OVBaseModel, OVModelPart from .modeling_decoder import CausalLMOutputWithPast, OVModelForCausalLM @@ -549,6 +548,8 @@ def _from_pretrained( ) if to_quantize: + from optimum.intel.openvino.quantization import OVQuantizer + quantization_config_copy = copy.deepcopy(quantization_config) quantization_config_copy.tokenizer = quantization_config.tokenizer or model_id potential_processor_id = config.mm_vision_tower if isinstance(model, _OVNanoLlavaForCausalLM) else model_id From e26f516db525bc682672cf424c0e2409673a308b Mon Sep 17 00:00:00 2001 From: eaidova Date: Wed, 4 Dec 2024 13:22:54 +0400 Subject: [PATCH 2/4] do not use TaskManager for getting task constant --- optimum/intel/openvino/modeling.py | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/optimum/intel/openvino/modeling.py b/optimum/intel/openvino/modeling.py index b765d2f9f4..9ee35f3687 100644 --- a/optimum/intel/openvino/modeling.py +++ b/optimum/intel/openvino/modeling.py @@ -50,8 +50,6 @@ XVectorOutput, ) -from optimum.exporters import TasksManager - from ..utils.import_utils import is_timm_available, is_timm_version from .modeling_base import OVBaseModel from .utils import _is_timm_ov_dir @@ -695,7 +693,7 @@ class OVModelForCTC(OVModel): """ auto_model_class = AutoModelForCTC - export_feature = TasksManager.infer_task_from_model(auto_model_class) + export_feature = "automatic-speech-recognition" @add_start_docstrings_to_model_forward( AUDIO_INPUTS_DOCSTRING.format("batch_size, sequence_length") @@ -775,7 +773,7 @@ class OVModelForAudioXVector(OVModel): """ auto_model_class = AutoModelForAudioXVector - export_feature = TasksManager.infer_task_from_model(auto_model_class) + export_feature = "audio-xvector" @add_start_docstrings_to_model_forward( AUDIO_INPUTS_DOCSTRING.format("batch_size, sequence_length") @@ -851,7 +849,7 @@ class OVModelForAudioFrameClassification(OVModel): """ auto_model_class = AutoModelForAudioFrameClassification - export_feature = TasksManager.infer_task_from_model(auto_model_class) + export_feature = "audio-frame-classification" @add_start_docstrings_to_model_forward( AUDIO_INPUTS_DOCSTRING.format("batch_size, sequence_length") From 97e9141109052c6cb8d14d98c16cfacd90aa9aa8 Mon Sep 17 00:00:00 2001 From: eaidova Date: Wed, 4 Dec 2024 13:52:18 +0400 Subject: [PATCH 3/4] avoid import onnx in modeling_base and stateful --- optimum/exporters/openvino/stateful.py | 3 ++- optimum/intel/openvino/modeling_base.py | 4 ++-- 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/optimum/exporters/openvino/stateful.py b/optimum/exporters/openvino/stateful.py index 4b4374ab51..39d64c2aec 100644 --- a/optimum/exporters/openvino/stateful.py +++ b/optimum/exporters/openvino/stateful.py @@ -20,7 +20,6 @@ import openvino as ov from openvino.runtime import opset13 -from optimum.exporters import TasksManager from optimum.intel.utils.import_utils import _openvino_version, is_openvino_version, is_transformers_version from .utils import MULTI_MODAL_TEXT_GENERATION_MODELS @@ -192,6 +191,8 @@ def ensure_stateful_is_available(warn=True): def ensure_export_task_support_stateful(task: str): + from optimum.exporters import TasksManager + task = TasksManager.map_from_synonym(task) return task in ["text-generation-with-past"] diff --git a/optimum/intel/openvino/modeling_base.py b/optimum/intel/openvino/modeling_base.py index 3799bf8567..99422f1a54 100644 --- a/optimum/intel/openvino/modeling_base.py +++ b/optimum/intel/openvino/modeling_base.py @@ -30,7 +30,7 @@ from transformers.generation import GenerationMixin from transformers.utils import is_offline_mode -from optimum.exporters.onnx import OnnxConfig +from optimum.exporters.base import ExportConfig from optimum.modeling_base import FROM_PRETRAINED_START_DOCSTRING, OptimizedModel from ...exporters.openvino import export, main_export @@ -623,7 +623,7 @@ def _to_load( cls, model, config: PretrainedConfig, - onnx_config: OnnxConfig, + onnx_config: ExportConfig, token: Optional[Union[bool, str]] = None, revision: Optional[str] = None, force_download: bool = False, From 6f6b24583c5f4a21dc36ad38925d415237b9ef16 Mon Sep 17 00:00:00 2001 From: eaidova Date: Wed, 4 Dec 2024 17:16:37 +0400 Subject: [PATCH 4/4] reduce onnx dependency --- optimum/exporters/openvino/__main__.py | 2 +- optimum/exporters/openvino/convert.py | 24 ++++++++++++++---------- 2 files changed, 15 insertions(+), 11 deletions(-) diff --git a/optimum/exporters/openvino/__main__.py b/optimum/exporters/openvino/__main__.py index 3ac8314889..0f68691634 100644 --- a/optimum/exporters/openvino/__main__.py +++ b/optimum/exporters/openvino/__main__.py @@ -29,7 +29,6 @@ from optimum.exporters import TasksManager from optimum.exporters.onnx.base import OnnxConfig from optimum.exporters.onnx.constants import SDPA_ARCHS_ONNX_EXPORT_NOT_SUPPORTED -from optimum.exporters.openvino.convert import export_from_model from optimum.intel.utils.import_utils import ( is_nncf_available, is_openvino_tokenizers_available, @@ -185,6 +184,7 @@ def main_export( >>> main_export("gpt2", output="gpt2_ov/") ``` """ + from optimum.exporters.openvino.convert import export_from_model if use_auth_token is not None: warnings.warn( diff --git a/optimum/exporters/openvino/convert.py b/optimum/exporters/openvino/convert.py index e4ece9801b..161b9372d5 100644 --- a/optimum/exporters/openvino/convert.py +++ b/optimum/exporters/openvino/convert.py @@ -20,7 +20,6 @@ from pathlib import Path from typing import TYPE_CHECKING, Any, Callable, Dict, List, Optional, Tuple, Union -import onnx from transformers.generation import GenerationMixin from transformers.utils import is_tf_available, is_torch_available @@ -28,10 +27,6 @@ from openvino.runtime.exceptions import OVTypeError from openvino.tools.ovc import convert_model from optimum.exporters import TasksManager -from optimum.exporters.onnx.base import OnnxConfig -from optimum.exporters.onnx.convert import check_dummy_inputs_are_allowed -from optimum.exporters.onnx.convert import export_pytorch as export_pytorch_to_onnx -from optimum.exporters.onnx.convert import export_tensorflow as export_tensorflow_onnx from optimum.exporters.utils import ( _get_submodels_and_export_configs as _default_get_submodels_and_export_configs, ) @@ -89,6 +84,7 @@ if TYPE_CHECKING: + from optimum.exporters.onnx.base import OnnxConfig from optimum.intel.openvino.configuration import OVConfig @@ -111,7 +107,7 @@ def _save_model( path: str, ov_config: Optional["OVConfig"] = None, library_name: Optional[str] = None, - config: OnnxConfig = None, + config: "OnnxConfig" = None, ): compress_to_fp16 = ov_config is not None and ov_config.dtype == "fp16" model = _add_version_info_to_model(model, library_name) @@ -125,7 +121,7 @@ def _save_model( def export( model: Union["PreTrainedModel", "TFPreTrainedModel", "ModelMixin", "DiffusionPipeline"], - config: OnnxConfig, + config: "OnnxConfig", output: Path, opset: Optional[int] = None, device: str = "cpu", @@ -208,7 +204,7 @@ def export( def export_tensorflow( model: Union["PreTrainedModel", "ModelMixin"], - config: OnnxConfig, + config: "OnnxConfig", opset: int, output: Path, ov_config: Optional["OVConfig"] = None, @@ -228,6 +224,8 @@ def export_tensorflow( output_names: list of output names from ONNX configuration bool: True if the model was exported successfully. """ + from optimum.exporters.onnx.convert import export_tensorflow as export_tensorflow_onnx + onnx_path = Path(output).with_suffix(".onnx") input_names, output_names = export_tensorflow_onnx(model, config, opset, onnx_path) ov_model = convert_model(str(onnx_path)) @@ -248,7 +246,7 @@ def export_tensorflow( def export_pytorch_via_onnx( model: Union["PreTrainedModel", "ModelMixin"], - config: OnnxConfig, + config: "OnnxConfig", opset: int, output: Path, device: str = "cpu", @@ -285,6 +283,8 @@ def export_pytorch_via_onnx( """ import torch + from optimum.exporters.onnx.convert import export_pytorch as export_pytorch_to_onnx + output = Path(output) orig_torch_onnx_export = torch.onnx.export torch.onnx.export = functools.partial(orig_torch_onnx_export, do_constant_folding=False) @@ -313,7 +313,7 @@ def export_pytorch_via_onnx( def export_pytorch( model: Union["PreTrainedModel", "ModelMixin"], - config: OnnxConfig, + config: "OnnxConfig", opset: int, output: Path, device: str = "cpu", @@ -355,6 +355,8 @@ def export_pytorch( import torch from torch.utils._pytree import tree_map + from optimum.exporters.onnx.convert import check_dummy_inputs_are_allowed + logger.info(f"Using framework PyTorch: {torch.__version__}") output = Path(output) @@ -869,6 +871,8 @@ def _add_version_info_to_model(model: Model, library_name: Optional[str] = None) model.set_rt_info(_nncf_version, ["optimum", "nncf_version"]) input_model = rt_info["conversion_parameters"].get("input_model", None) if input_model is not None and "onnx" in input_model.value: + import onnx + model.set_rt_info(onnx.__version__, ["optimum", "onnx_version"]) except Exception: