openvino device selection

Signed-off-by: vladmandic <mandic00@live.com>
pull/4752/head
vladmandic 2026-04-11 12:06:42 +02:00
parent 1e38ff4623
commit d1a40b3ba7
5 changed files with 86 additions and 70 deletions

View File

@ -706,7 +706,7 @@ def install_ipex():
def install_openvino():
t_start = time.time()
log.info('OpenVINO: selected')
log.info('Backend: OpenVINO')
os.environ.setdefault('PYTORCH_TRACING_MODE', 'TORCHFX')
if sys.platform == 'darwin':
torch_command = os.environ.get('TORCH_COMMAND', 'torch==2.11.0 torchvision==0.26.0')

View File

@ -123,9 +123,12 @@ def get_gpu_info():
if not torch.cuda.is_available():
try:
if backend == 'openvino':
from modules.intel.openvino import get_openvino_device
from modules.intel.openvino import get_openvino_device, get_device_list, get_device, get_openvino_capabilities
devices = [{ device: f'{get_openvino_device(device)}' } for device in get_device_list()]
return {
'device': get_openvino_device(), # pylint: disable=used-before-assignment
'active': f'"{get_device()}"',
'capabilities': get_openvino_capabilities(),
'devices': devices,
'openvino': get_package_version("openvino"),
}
elif backend == 'directml':
@ -325,9 +328,12 @@ def test_fp16():
if fp16_ok is not None:
return fp16_ok
if opts.cuda_dtype != 'FP16': # don't override if the user sets it
if sys.platform == "darwin" or backend in {'openvino', 'cpu'}: # override
if sys.platform == "darwin" or backend == 'cpu': # override
fp16_ok = False
return fp16_ok
elif backend == 'openvino':
from modules.intel.openvino import test_openvino_fp16
fp16_ok = test_openvino_fp16()
elif backend == 'rocm':
# gfx1102 (RX 7600, 7500, 7650 and 7700S) causes segfaults with fp16
# agent can be overriden to gfx1100 to get gfx1102 working with ROCm so check the gpu name as well
@ -356,9 +362,12 @@ def test_bf16():
if bf16_ok is not None:
return bf16_ok
if opts.cuda_dtype != 'BF16': # don't override if the user sets it
if sys.platform == "darwin" or backend in {'openvino', 'directml', 'cpu'}: # override
if sys.platform == "darwin" or backend in {'directml', 'cpu'}: # override
bf16_ok = False
return bf16_ok
elif backend == 'openvino':
from modules.intel.openvino import test_openvino_bf16
bf16_ok = test_openvino_bf16()
elif backend == 'rocm' or backend == 'zluda':
agent = None
if backend == 'rocm':

View File

@ -1,30 +1,30 @@
import os
import torch
from openvino.frontend.pytorch.torchdynamo.partition import Partitioner
from openvino.frontend.pytorch.fx_decoder import TorchFXPythonDecoder
from types import MappingProxyType
from hashlib import sha256
from openvino.frontend.pytorch.torchdynamo.partition import Partitioner # pylint: disable=no-name-in-module
from openvino.frontend.pytorch.fx_decoder import TorchFXPythonDecoder # pylint: disable=no-name-in-module
from openvino.frontend import FrontEndManager # pylint: disable=no-name-in-module
from openvino import Core, Type, PartialShape, serialize # pylint: disable=no-name-in-module
from openvino import Core, Type, PartialShape, serialize # pylint: disable=no-name-in-module, import-self
from openvino.properties import hint as ov_hints # pylint: disable=no-name-in-module
import torch
from torch._dynamo.backends.common import fake_tensor_unsupported
from torch._dynamo.backends.registry import register_backend
from torch.fx.experimental.proxy_tensor import make_fx
from torch.fx import GraphModule
from torch.utils._pytree import tree_flatten
from types import MappingProxyType
from hashlib import sha256
import installer
from modules import shared, devices, sd_models_utils
from modules import shared, devices
from modules.logger import log
# Set default params
subgraph_type = []
torch._dynamo.config.cache_size_limit = max(64, torch._dynamo.config.cache_size_limit) # pylint: disable=protected-access
torch._dynamo.eval_frame.check_if_dynamo_supported = lambda: True # pylint: disable=protected-access
if hasattr(torch._dynamo.config, "inline_inbuilt_nn_modules"):
if hasattr(torch._dynamo.config, "inline_inbuilt_nn_modules"): # pylint: disable=protected-access
torch._dynamo.config.inline_inbuilt_nn_modules = False # pylint: disable=protected-access
@ -56,7 +56,7 @@ if hasattr(torch, "float8_e8m0fnu"):
# One-shot warning flag: warn_once() logs only the first message per process.
warned = False

def warn_once(msg):
    """Log *msg* as a warning the first time this is called; later calls are no-ops."""
    global warned  # pylint: disable=global-statement
    if not warned:
        log.warning(msg)
        warned = True
@ -86,50 +86,59 @@ class OpenVINOGraphModule(torch.nn.Module):
def get_device_list():
    """Return the OpenVINO devices available on this host, priority-sorted.

    Sort order is NPU > GPU > everything else (e.g. CPU); devices within the
    same class keep a stable alphabetical order via the secondary key.
    """
    core = Core()
    available_devices = core.available_devices
    available_devices.sort(key=lambda d: (0 if "NPU" in d else 1 if "GPU" in d else 2, d))  # priority order: NPU > GPU > CPU
    return available_devices
def get_device():
    """Resolve the OpenVINO device string from the user's settings.

    - exactly one device selected: return it directly
    - multiple devices selected: build a ``HETERO:`` device string from the
      selected devices in :func:`get_device_list` priority order, optionally
      filtered by ``--device-id`` (substring match, e.g. ``'0'`` in ``'GPU.0'``);
      falls back to ``'auto'`` when no selected device matches
    - nothing selected: return ``'AUTO'`` and let OpenVINO choose
    """
    if len(shared.opts.openvino_devices) == 1:
        return shared.opts.openvino_devices[0]
    if len(shared.opts.openvino_devices) > 1:
        active_device = []
        for hetero_device in get_device_list():
            if hetero_device in shared.opts.openvino_devices:
                # honor --device-id when provided; None means accept any device
                if (shared.cmd_opts.device_id is None) or (shared.cmd_opts.device_id in hetero_device):
                    active_device.append(hetero_device)
        device = f"HETERO:{','.join(active_device)}" if len(active_device) > 0 else 'auto'
    else:  # len(shared.opts.openvino_devices) == 0
        device = 'AUTO'
    return device
def get_openvino_device(device=None):
    """Return the human-readable name of *device* (default: the active device).

    Falls back to a generic ``"OpenVINO <device>"`` string when the property
    is unavailable (e.g. virtual devices such as AUTO/HETERO may not expose
    FULL_DEVICE_NAME).
    """
    core = Core()
    try:
        return core.get_property(device or get_device(), "FULL_DEVICE_NAME")
    except Exception:
        return f"OpenVINO {get_device()}"
def get_openvino_capabilities(device=None):
    """Return the OPTIMIZATION_CAPABILITIES list for *device* (default: active device).

    Returns an empty list when the property is missing, raises, or is not a list,
    so callers can always do membership tests safely.
    """
    core = Core()
    try:
        capabilities = core.get_property(device or get_device(), "OPTIMIZATION_CAPABILITIES")
        return capabilities if isinstance(capabilities, list) else []
    except Exception:
        return []
def test_openvino_fp16():
    """Return True when the active OpenVINO device advertises FP16 support."""
    try:
        return 'FP16' in get_openvino_capabilities()
    except Exception:
        # capability probing is best-effort; assume no FP16 on any failure
        return False
def test_openvino_bf16():
    """Return True when the active OpenVINO device advertises BF16 support."""
    try:
        return 'BF16' in get_openvino_capabilities()
    except Exception:
        # capability probing is best-effort; assume no BF16 on any failure
        return False
def cached_model_name(model_hash_str, device, args, cache_root, reversed = False):
if model_hash_str is None:
return None
@ -183,7 +192,7 @@ def execute_cached(compiled_model, *args):
flat_args, _ = tree_flatten(args)
ov_inputs = [a.detach().cpu().numpy() for a in flat_args]
if (shared.compiled_model_state.cn_model == []):
if shared.compiled_model_state.cn_model == []:
ov_inputs.reverse()
res = compiled_model(ov_inputs)
@ -218,8 +227,8 @@ def openvino_compile(gm: GraphModule, *example_inputs, model_hash_str: str | Non
if file_name is not None:
serialize(om, file_name + ".xml", file_name + ".bin")
if (shared.compiled_model_state.cn_model != []):
f = open(file_name + ".txt", "w")
if shared.compiled_model_state.cn_model != []:
f = open(file_name + ".txt", "w", encoding="utf-8")
for input_data in example_inputs:
f.write(str(input_data.size()))
f.write("\n")
@ -380,21 +389,18 @@ def generate_subgraph_str(tensor):
def get_subgraph_type(tensor):
    """Record the type of *tensor* into the module-level ``subgraph_type`` list.

    Identity pass-through so it can be used with ``Module.apply``; returns
    *tensor* unchanged.
    """
    # no 'global' declaration needed: we mutate subgraph_type in place, never rebind it
    subgraph_type.append(type(tensor))
    return tensor
@fake_tensor_unsupported
def openvino_fx(subgraph, example_inputs, options=None):
global subgraph_type
def openvino_fx(subgraph, example_inputs, options=None): # pylint: disable=unused-argument
dont_use_faketensors = False
executor_parameters = None
inputs_reversed = False
maybe_fs_cached_name = None
subgraph_type = []
subgraph_type.clear()
subgraph.apply(get_subgraph_type)
"""
@ -433,13 +439,13 @@ def openvino_fx(subgraph, example_inputs, options=None):
if os.path.isfile(maybe_fs_cached_name + ".xml") and os.path.isfile(maybe_fs_cached_name + ".bin"):
example_inputs_reordered = []
if (os.path.isfile(maybe_fs_cached_name + ".txt")):
f = open(maybe_fs_cached_name + ".txt")
if os.path.isfile(maybe_fs_cached_name + ".txt"):
f = open(maybe_fs_cached_name + ".txt", "r", encoding="utf-8")
for input_data in example_inputs:
shape = f.readline()
if (str(input_data.size()) != shape):
if str(input_data.size()) != shape:
for idx1, input_data1 in enumerate(example_inputs):
if (str(input_data1.size()).strip() == str(shape).strip()):
if str(input_data1.size()).strip() == str(shape).strip():
example_inputs_reordered.append(example_inputs[idx1])
example_inputs = example_inputs_reordered
@ -447,7 +453,8 @@ def openvino_fx(subgraph, example_inputs, options=None):
pass
else:
# Delete unused subgraphs
subgraph = subgraph.apply(sd_models_utils.convert_to_faketensors)
from modules.sd_models_utils import convert_to_faketensors
subgraph = subgraph.apply(convert_to_faketensors)
devices.torch_gc(force=True, reason='openvino')
# Model is fully supported and already cached. Run the cached OV model directly.
@ -456,13 +463,13 @@ def openvino_fx(subgraph, example_inputs, options=None):
def _call(*args):
if (shared.compiled_model_state.cn_model != [] and str(shared.compiled_model_state.cn_model) in maybe_fs_cached_name):
args_reordered = []
if (os.path.isfile(maybe_fs_cached_name + ".txt")):
f = open(maybe_fs_cached_name + ".txt")
if os.path.isfile(maybe_fs_cached_name + ".txt"):
f = open(maybe_fs_cached_name + ".txt", "r", encoding="utf-8")
for input_data in args:
shape = f.readline()
if (str(input_data.size()) != shape):
if str(input_data.size()) != shape:
for idx1, input_data1 in enumerate(args):
if (str(input_data1.size()).strip() == str(shape).strip()):
if str(input_data1.size()).strip() == str(shape).strip():
args_reordered.append(args[idx1])
args = args_reordered
@ -479,7 +486,7 @@ def openvino_fx(subgraph, example_inputs, options=None):
for node in model.graph.nodes:
if node.target == torch.ops.aten.mul_.Tensor:
node.target = torch.ops.aten.mul.Tensor
elif node.target == torch.ops.aten._unsafe_index.Tensor:
elif node.target == torch.ops.aten._unsafe_index.Tensor: # pylint: disable=protected-access
node.target = torch.ops.aten.index.Tensor
with devices.inference_context():
model.eval()

View File

@ -105,7 +105,7 @@ def gpu_stats():
gpu['used'] = 0
gpu['error'] = str(e)
if not fail_once:
log.warning(f'GPU stats: {e}')
# log.warning(f'GPU stats: {e}')
# errors.display(e, 'GPU stats')
fail_once = True
return gpu

View File

@ -180,7 +180,7 @@ def create_settings(cmd_opts):
options_templates.update(options_section(('vae_encoder', "Variational Auto Encoder"), {
"sd_vae": OptionInfo("Automatic", "VAE model", gr.Dropdown, lambda: {"choices": shared_items.sd_vae_items()}, refresh=shared_items.refresh_vae_list),
"diffusers_vae_upcast": OptionInfo("default", "VAE upcasting", gr.Radio, {"choices": ['default', 'true', 'false']}),
"no_half_vae": OptionInfo(False if not cmd_opts.use_openvino else True, "Full precision (--no-half-vae)"),
"no_half_vae": OptionInfo(False, "Full precision (--no-half-vae)"),
"diffusers_vae_slicing": OptionInfo(True, "VAE slicing", gr.Checkbox),
"diffusers_vae_tiling": OptionInfo(cmd_opts.lowvram, "VAE tiling", gr.Checkbox),
"diffusers_vae_tile_size": OptionInfo(0, "VAE tile size", gr.Slider, {"minimum": 0, "maximum": 4096, "step": 8 }),
@ -208,7 +208,7 @@ def create_settings(cmd_opts):
"math_sep": OptionInfo("<h2>Execution Precision</h2>", "", gr.HTML),
"precision": OptionInfo("Autocast", "Precision type", gr.Radio, {"choices": ["Autocast", "Full"], "visible": False}),
"cuda_dtype": OptionInfo("Auto", "Device precision type", gr.Radio, {"choices": ["Auto", "FP32", "FP16", "BF16"]}),
"no_half": OptionInfo(False if not cmd_opts.use_openvino else True, "Force full precision (--no-half)", None, None, None),
"no_half": OptionInfo(False, "Force full precision (--no-half)", None, None, None),
"upcast_sampling": OptionInfo(False if sys.platform != "darwin" else True, "Upcast sampling", gr.Checkbox, {"visible": False}),
"generator_sep": OptionInfo("<h2>Noise Options</h2>", "", gr.HTML),
@ -265,10 +265,10 @@ def create_settings(cmd_opts):
"ipex_optimize": OptionInfo([], "IPEX Optimize", gr.CheckboxGroup, {"choices": ["Model", "TE", "VAE", "Upscaler"], "visible": devices.backend == "ipex"}),
"openvino_sep": OptionInfo("<h2>OpenVINO</h2>", "", gr.HTML, {"visible": cmd_opts.use_openvino}),
"openvino_devices": OptionInfo([], "OpenVINO devices to use", gr.CheckboxGroup, {"choices": get_openvino_device_list() if cmd_opts.use_openvino else [], "visible": cmd_opts.use_openvino}),
"openvino_devices": OptionInfo([], "OpenVINO device", gr.CheckboxGroup, {"choices": get_openvino_device_list() if cmd_opts.use_openvino else [], "visible": cmd_opts.use_openvino}),
"openvino_accuracy": OptionInfo("default", "OpenVINO accuracy mode", gr.Radio, {"choices": ["default", "performance", "accuracy"], "visible": cmd_opts.use_openvino}),
"openvino_disable_model_caching": OptionInfo(True, "OpenVINO disable model caching", gr.Checkbox, {"visible": cmd_opts.use_openvino}),
"openvino_disable_memory_cleanup": OptionInfo(True, "OpenVINO disable memory cleanup after compile", gr.Checkbox, {"visible": cmd_opts.use_openvino}),
"openvino_disable_memory_cleanup": OptionInfo(True, "OpenVINO disable memory cleanup", gr.Checkbox, {"visible": cmd_opts.use_openvino}),
"directml_sep": OptionInfo("<h2>DirectML</h2>", "", gr.HTML, {"visible": devices.backend == "directml"}),
"directml_memory_provider": OptionInfo(default_memory_provider, "DirectML memory stats provider", gr.Radio, {"choices": memory_providers, "visible": devices.backend == "directml"}),