4 changes: 2 additions & 2 deletions backends/openvino/README.md
@@ -109,9 +109,9 @@ Follow the steps below to setup your build environment:
```bash
./openvino_build.sh --cpp_runtime
```
**Build C++ Llama Runner**: First, ensure the C++ runtime libraries are built by following the earlier instructions. Then, run the `openvino_build.sh` script with the `--llama_runner` flag to compile the Llama runner as shown in the command below, which enables executing inference with models exported using export_llama. The resulting binary is located at: `<executorch_root>/cmake-out/examples/models/llama/llama_main`
**Build C++ Runtime Libraries with LLM Extension**: Run the `openvino_build.sh` script with the `--cpp_runtime_llm` flag to build the C++ runtime libraries with the LLM extension, as shown in the command below. Use this option instead of `--cpp_runtime` for LLM extension support, which is required by the LLM examples.
```bash
./openvino_build.sh --llama_runner
./openvino_build.sh --cpp_runtime_llm
```

For more information about ExecuTorch environment setup, refer to the [Environment Setup](https://pytorch.org/executorch/main/getting-started-setup#environment-setup) guide.
1 change: 0 additions & 1 deletion backends/openvino/requirements.txt
@@ -1,2 +1 @@
transformers
git+https://github.com/openvinotoolkit/nncf@3d753ac#egg=nncf
81 changes: 32 additions & 49 deletions backends/openvino/scripts/openvino_build.sh
@@ -7,69 +7,55 @@ set -e
EXECUTORCH_ROOT=$(realpath "$(dirname "$0")/../../..")
echo EXECUTORCH_ROOT=${EXECUTORCH_ROOT}

# Enter the Executorch root directory
cd "$EXECUTORCH_ROOT"

install_requirements() {
echo "Installing Requirements For OpenVINO Backend"
cd "$EXECUTORCH_ROOT"
pip install -r backends/openvino/requirements.txt
}

build_cpp_runtime() {
echo "Building C++ Runtime Libraries"

local llm_enabled=${1:-0}

# Set build directory
local build_dir="cmake-out"

# Enter the Executorch root directory
cd "$EXECUTORCH_ROOT"
rm -rf "${build_dir}"

CMAKE_ARGS=(
"-DCMAKE_BUILD_TYPE=Release"
"-DEXECUTORCH_BUILD_OPENVINO=ON"
"-DEXECUTORCH_BUILD_EXTENSION_DATA_LOADER=ON"
"-DEXECUTORCH_BUILD_EXTENSION_MODULE=ON"
"-DEXECUTORCH_BUILD_EXTENSION_NAMED_DATA_MAP=ON"
"-DEXECUTORCH_BUILD_EXTENSION_RUNNER_UTIL=ON"
"-DEXECUTORCH_BUILD_EXTENSION_FLAT_TENSOR=ON"
"-DEXECUTORCH_BUILD_EXTENSION_TENSOR=ON"
"-DEXECUTORCH_BUILD_EXECUTOR_RUNNER=ON"
"-DEXECUTORCH_BUILD_KERNELS_QUANTIZED=ON"
)

if [[ "$llm_enabled" -eq 1 ]]; then
CMAKE_ARGS+=("-DEXECUTORCH_BUILD_EXTENSION_LLM=ON" "-DEXECUTORCH_BUILD_EXTENSION_LLM_RUNNER=ON")
fi

# Configure the project with CMake
# Note: Add any additional configuration options you need here
cmake -DCMAKE_INSTALL_PREFIX="${build_dir}" \
-DCMAKE_BUILD_TYPE=Release \
-DEXECUTORCH_BUILD_OPENVINO=ON \
-DEXECUTORCH_BUILD_EXTENSION_DATA_LOADER=ON \
-DEXECUTORCH_BUILD_EXTENSION_MODULE=ON \
-DEXECUTORCH_BUILD_EXTENSION_NAMED_DATA_MAP=ON \
-DEXECUTORCH_BUILD_EXTENSION_RUNNER_UTIL=ON \
-DEXECUTORCH_BUILD_EXTENSION_FLAT_TENSOR=ON \
-DEXECUTORCH_BUILD_EXTENSION_TENSOR=ON \
-DEXECUTORCH_BUILD_EXECUTOR_RUNNER=ON \
-DEXECUTORCH_BUILD_KERNELS_QUANTIZED=ON \
-DEXECUTORCH_BUILD_EXTENSION_LLM=ON \
-DEXECUTORCH_BUILD_EXTENSION_LLM_RUNNER=ON \
"${CMAKE_ARGS[@]}" \
-B"${build_dir}"


# Build the project
cmake --build ${build_dir} --target install --config Release -j$(nproc)
}

build_llama_runner() {
echo "Building Export Llama Runner"

# Set build directory
local build_dir="cmake-out"

# Enter the Executorch root directory
cd "$EXECUTORCH_ROOT"

# Configure the project with CMake
# Note: Add any additional configuration options you need here
cmake -DCMAKE_INSTALL_PREFIX="${build_dir}" \
-DCMAKE_BUILD_TYPE=Release \
-B"${build_dir}"/examples/models/llama \
examples/models/llama
# Build the export llama runner
cmake --build cmake-out/examples/models/llama -j$(nproc) --config Release
}

build_python_enabled() {
echo "Building Python Package with Pybinding"

# Enter the Executorch root directory
cd "$EXECUTORCH_ROOT"
./install_executorch.sh --clean

# Set parameters to configure the project with CMake
# Note: Add any additional configuration options you need here
@@ -78,32 +64,29 @@ build_python_enabled() {
export CMAKE_BUILD_ARGS="--target openvino_backend"

# Build the package
./install_executorch.sh --minimal

# Install torchao
pip install third-party/ao
./install_executorch.sh
}

main() {
build_type=${1:-"--build_all"}

# If the first arguments is --build_all (default), build python package, C++ runtime, and llama runner binary
# If the first argument is --build_all (default), build the python package and C++ runtime
if [[ -z "$build_type" || "$build_type" == "--build_all" ]]; then
./install_executorch.sh --clean
install_requirements
build_python_enabled
build_cpp_runtime
build_llama_runner

# If the first arguments is --cpp_runtime, build libraries for C++ runtime
# If the first argument is --cpp_runtime, build libraries for C++ runtime
elif [[ "$build_type" == "--cpp_runtime" ]]; then
build_cpp_runtime

# If the first arguments is --llama_runner, build export llama runner binary
# Note: c++ runtime with openvino backend should be built before building export llama runner
elif [[ "$build_type" == "--llama_runner" ]]; then
build_llama_runner
# If the first argument is --cpp_runtime_llm, build C++ runtime with llm extension
# Note: the C++ runtime with OpenVINO backend should be built before building the llama runner
elif [[ "$build_type" == "--cpp_runtime_llm" ]]; then
build_cpp_runtime 1

# If the first arguments is --enable_python, build python package with python bindings
# If the first argument is --enable_python, build python package with python bindings
elif [[ "$build_type" == "--enable_python" ]]; then
install_requirements
build_python_enabled
Expand Down
14 changes: 3 additions & 11 deletions examples/models/yolo12/CMakeLists.txt
@@ -2,7 +2,7 @@ cmake_minimum_required(VERSION 3.5)

project(Yolo12DetectionDemo VERSION 0.1)

option(USE_OPENVINO_BACKEND "Build the tutorial with the OPENVINO backend" ON)
option(USE_OPENVINO_BACKEND "Build the tutorial with the OPENVINO backend" OFF)
option(USE_XNNPACK_BACKEND "Build the tutorial with the XNNPACK backend" OFF)

set(CMAKE_INCLUDE_CURRENT_DIR ON)
@@ -38,21 +38,13 @@ list(APPEND link_libraries portable_ops_lib portable_kernels)
executorch_target_link_options_shared_lib(portable_ops_lib)

if(USE_XNNPACK_BACKEND)
set(xnnpack_backend_libs xnnpack_backend XNNPACK microkernels-prod)
set(xnnpack_backend_libs xnnpack_backend XNNPACK xnnpack-microkernels-prod)
list(APPEND link_libraries ${xnnpack_backend_libs})
executorch_target_link_options_shared_lib(xnnpack_backend)
endif()

if(USE_OPENVINO_BACKEND)
add_subdirectory(${EXECUTORCH_ROOT}/backends/openvino openvino_backend)

target_include_directories(
openvino_backend
INTERFACE
${CMAKE_CURRENT_BINARY_DIR}/../../include
${CMAKE_CURRENT_BINARY_DIR}/../../include/executorch/runtime/core/portable_type/c10
${CMAKE_CURRENT_BINARY_DIR}/../../lib
)
find_package(OpenVINO REQUIRED)
list(APPEND link_libraries openvino_backend)
executorch_target_link_options_shared_lib(openvino_backend)
endif()
10 changes: 4 additions & 6 deletions examples/models/yolo12/README.md
@@ -31,15 +31,13 @@ To install ExecuTorch, follow this [guide](https://pytorch.org/executorch/stable

### Step 3: Install the demo requirements

Python demo requirements:
#### Python Demo Requirements
The demo requires the `ultralytics` package, which depends on `torch` and `torchvision`. Since these packages are already installed as dev dependencies, use `--upgrade-strategy only-if-needed` to avoid version conflicts:

```bash
python -m pip install -r examples/models/yolo12/requirements.txt
python -m pip install --upgrade-strategy only-if-needed -r requirements.txt
```

Demo inference dependency - OpenCV library:
<https://opencv.org/get-started/>

### Step 4: Export the YOLO12 model to the ExecuTorch

OpenVINO:
@@ -51,7 +49,7 @@ python export_and_validate.py --model_name yolo12s --input_dims=[1920,1080] --b
OpenVINO quantized model:

```bash
python export_and_validate.py --model_name yolo12s --input_dims=[1920,1080] --backend openvino --quantize --video_input /path/to/calibration/video --device CPU
python export_and_validate.py --model_name yolo12s --input_dims=[1920,1080] --backend openvino --quantize --video_path /path/to/calibration/video --device CPU
```

XNNPACK:
3 changes: 2 additions & 1 deletion examples/models/yolo12/requirements.txt
@@ -1 +1,2 @@
ultralytics==8.3.97
ultralytics==8.3.196
opencv-python
5 changes: 5 additions & 0 deletions examples/openvino/README.md
@@ -13,6 +13,11 @@ examples/openvino
└── llama
├── README.md # Documentation for Llama example
└── llama3_2_ov_4wo.yaml # Configuration file for exporting Llama3.2 with OpenVINO backend
└── stable_diffusion
├── README.md # Documentation for Stable Diffusion example
├── export_lcm.py # Script for exporting models
├── openvino_lcm.py # Script for inference execution
└── requirements.txt # Requirements file for Stable Diffusion example
```

# Build Instructions for Examples
14 changes: 10 additions & 4 deletions examples/openvino/llama/README.md
@@ -28,13 +28,19 @@ python -m executorch.extension.llm.export.export_llm \
The OpenVINO backend also offers quantization support for Llama models at export time. The available modes are INT4 group-wise and per-channel weight compression, and INT8 per-channel weight compression. Enable quantization by setting the `pt2e_quantize` option under `quantization` in the `llama3_2_ov_4wo.yaml` file: use `openvino_4wo` for INT4 (the default in `llama3_2_ov_4wo.yaml`) or `openvino_8wo` for INT8 weight compression. To change the group size, set the `group_size` option under `quantization`; the default of 128 achieves optimal performance with the NPU.
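
A minimal sketch of the corresponding `quantization` section (assuming the option names described above; the exact schema is defined by `export_llm`):

```yaml
quantization:
  # openvino_4wo = INT4 weight compression (default); openvino_8wo = INT8
  pt2e_quantize: openvino_4wo
  # Group size for group-wise compression; 128 targets optimal NPU performance
  group_size: 128
```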

## Build OpenVINO C++ Runtime with Llama Runner:
First, build the backend libraries by executing the script below in `<executorch_root>/backends/openvino/scripts` folder:
First, build the backend libraries with the LLM extension by executing the script below in the `<executorch_root>/backends/openvino/scripts` folder:
```bash
./openvino_build.sh --cpp_runtime
./openvino_build.sh --cpp_runtime_llm
```
Then, build the llama runner by executing the script below (with `--llama_runner` argument) also in `<executorch_root>/backends/openvino/scripts` folder:
Then, build the llama runner by executing the commands below in the `<executorch_root>` folder:
```bash
./openvino_build.sh --llama_runner
# Configure the project with CMake
cmake -DCMAKE_INSTALL_PREFIX=cmake-out \
-DCMAKE_BUILD_TYPE=Release \
-Bcmake-out/examples/models/llama \
examples/models/llama
# Build the llama runner
cmake --build cmake-out/examples/models/llama -j$(nproc) --config Release
```
The executable is saved in `<executorch_root>/cmake-out/examples/models/llama/llama_main`
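
Once built, inference can be run along these lines (a sketch assuming the standard `llama_main` flags; the model and tokenizer paths are placeholders for the artifacts produced by `export_llm`):

```bash
# Hypothetical artifact paths; substitute your exported .pte and matching tokenizer
./cmake-out/examples/models/llama/llama_main \
    --model_path=llama3_2.pte \
    --tokenizer_path=tokenizer.model \
    --prompt="What is the capital of France?"
```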

2 changes: 1 addition & 1 deletion examples/openvino/stable_diffusion/README.md
@@ -45,4 +45,4 @@ python openvino_lcm.py \

This implementation supports LCM-based Stable Diffusion models:
- **SimianLuo/LCM_Dreamshaper_v7**
- **latent-consistency/lcm-sdxl**
- **latent-consistency/lcm-sdxl**
2 changes: 1 addition & 1 deletion examples/openvino/stable_diffusion/requirements.txt
@@ -1 +1 @@
diffusers>=0.29.0
diffusers>=0.29.0