Skip to content

Commit 3285bb2

Browse files
Update
[ghstack-poisoned]
2 parents d761fdb + ba0e56e commit 3285bb2

35 files changed

Lines changed: 845 additions & 381 deletions

File tree

Lines changed: 29 additions & 30 deletions
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,7 @@
66
# LICENSE file in the root directory of this source tree.
77

88
set -ex
9+
910
# shellcheck source=/dev/null
1011
source "$(dirname "${BASH_SOURCE[0]}")/utils.sh"
1112

@@ -50,21 +51,21 @@ PT2E_QUANTIZE="${PT2E_QUANTIZE:-}"
5051
# Default CMake Build Type to release mode
5152
CMAKE_BUILD_TYPE=${CMAKE_BUILD_TYPE:-Release}
5253

53-
if [[ $# -lt 5 ]]; then # Assuming 5 mandatory args
54-
echo "Expecting at least 5 positional arguments"
55-
echo "Usage: [...]"
56-
fi
5754
if [[ -z "${MODEL_NAME:-}" ]]; then
5855
echo "Missing model name, exiting..."
5956
exit 1
6057
fi
6158

62-
6359
if [[ -z "${MODE:-}" ]]; then
6460
echo "Missing mode, choose openvino or xnnpack, exiting..."
6561
exit 1
6662
fi
6763

64+
if [[ -z "${VIDEO_PATH:-}" ]]; then
65+
echo "Missing video path, exiting..."
66+
exit 1
67+
fi
68+
6869
if [[ -z "${PYTHON_EXECUTABLE:-}" ]]; then
6970
PYTHON_EXECUTABLE=python3
7071
fi
@@ -75,21 +76,13 @@ if [[ "${MODE}" =~ .*openvino.* ]]; then
7576
OPENVINO=ON
7677
TARGET_LIBS="$TARGET_LIBS openvino_backend "
7778

78-
git clone https://github.com/openvinotoolkit/openvino.git
79-
cd openvino && git b16b776ac119dafda51f69a80f1e6b7376d02c3b
80-
git submodule update --init --recursive
81-
sudo ./install_build_dependencies.sh
82-
mkdir build && cd build
83-
cmake .. -DCMAKE_BUILD_TYPE=Release -DENABLE_PYTHON=ON
84-
make -j$(nproc)
85-
86-
cd ..
87-
cmake --install build --prefix dist
88-
89-
source dist/setupvars.sh
90-
cd ../backends/openvino
91-
pip install -r requirements.txt
92-
cd ../../
79+
# Install specific OpenVINO runtime from pip.
80+
$PYTHON_EXECUTABLE -m pip install --pre openvino==2026.1.0.dev20260131 --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
81+
$PYTHON_EXECUTABLE -m pip install -r backends/openvino/requirements.txt
82+
83+
# Set OPENVINO_LIB_PATH so the C++ demo runner can also find libopenvino_c.so.
84+
OPENVINO_LIB_PATH=$($PYTHON_EXECUTABLE -c "import openvino, os, glob; print(sorted(glob.glob(os.path.join(os.path.dirname(openvino.__file__), 'libs', 'libopenvino_c.so*')))[-1])")
85+
export OPENVINO_LIB_PATH
9386
else
9487
OPENVINO=OFF
9588
fi
@@ -103,9 +96,10 @@ fi
10396

10497
which "${PYTHON_EXECUTABLE}"
10598

99+
TORCH_URL=https://download.pytorch.org/whl/cpu
106100

107-
DIR="examples/models/yolo12"
108-
$PYTHON_EXECUTABLE -m pip install -r ${DIR}/requirements.txt
101+
DIR="examples/models/yolo26"
102+
$PYTHON_EXECUTABLE -m pip install --upgrade-strategy only-if-needed --extra-index-url "$TORCH_URL" -r ${DIR}/requirements.txt
109103

110104
cmake_install_executorch_libraries() {
111105
rm -rf cmake-out
@@ -142,11 +136,11 @@ cmake_install_executorch_libraries() {
142136

143137
echo $TARGET_LIBS
144138
export CMAKE_BUILD_ARGS="--target $TARGET_LIBS"
145-
pip install . --no-build-isolation
139+
$PYTHON_EXECUTABLE -m pip install . --no-build-isolation
146140
}
147141

148142
cmake_build_demo() {
149-
echo "Building yolo12 runner"
143+
echo "Building yolo26 runner"
150144
retry cmake \
151145
-DCMAKE_BUILD_TYPE="$CMAKE_BUILD_TYPE" \
152146
-DUSE_OPENVINO_BACKEND="$OPENVINO" \
@@ -174,24 +168,29 @@ prepare_artifacts_upload() {
174168

175169

176170
# Export model.
177-
EXPORTED_MODEL_NAME="${MODEL_NAME}_fp32_${MODE}.pte"
178-
echo "Exporting ${EXPORTED_MODEL_NAME}"
179171
EXPORT_ARGS="--model_name=${MODEL_NAME} --backend=${MODE}"
172+
if [[ -n "${PT2E_QUANTIZE}" ]]; then
173+
EXPORTED_MODEL_NAME="${MODEL_NAME}_int8_${MODE}.pte"
174+
EXPORT_ARGS="${EXPORT_ARGS} --quantize --video_path=${VIDEO_PATH}"
175+
else
176+
EXPORTED_MODEL_NAME="${MODEL_NAME}_fp32_${MODE}.pte"
177+
fi
178+
echo "Exporting ${EXPORTED_MODEL_NAME}"
180179

181180
# Add dynamically linked library location
182181
cmake_install_executorch_libraries
183182

184-
$PYTHON_EXECUTABLE -m examples.models.yolo12.export_and_validate ${EXPORT_ARGS}
183+
$PYTHON_EXECUTABLE -m examples.models.yolo26.export_and_validate ${EXPORT_ARGS}
185184

186185

187186
RUNTIME_ARGS="--model_path=${EXPORTED_MODEL_NAME} --input_path=${VIDEO_PATH}"
188187
# Check build tool.
189188
cmake_build_demo
190-
# Run yolo12 runner
189+
# Run yolo26 runner
191190
NOW=$(date +"%H:%M:%S")
192-
echo "Starting to run yolo12 runner at ${NOW}"
191+
echo "Starting to run yolo26 runner at ${NOW}"
193192
# shellcheck source=/dev/null
194-
cmake-out/examples/models/yolo12/Yolo12DetectionDemo ${RUNTIME_ARGS} > result.txt
193+
cmake-out/examples/models/yolo26/Yolo26DetectionDemo ${RUNTIME_ARGS} > result.txt
195194
NOW=$(date +"%H:%M:%S")
196195
echo "Finished at ${NOW}"
197196

.github/labeler.yml

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,15 @@
1+
"module: arm":
2+
- changed-files:
3+
- any-glob-to-any-file:
4+
- 'backends/arm/**'
5+
- 'examples/arm/**'
6+
- 'docs/source/backends/arm-*/**'
7+
- 'docs/source/embedded-arm-ethos-u.md'
8+
- 'docs/source/android-arm-vgf.md'
9+
- 'docs/source/arm-delegate-runtime-build.svg'
10+
11+
ciflow/trunk:
12+
- changed-files:
13+
- any-glob-to-any-file:
14+
- 'backends/arm/**'
15+
- 'examples/arm/**'

.github/workflows/labeler.yml

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,14 @@
1+
name: Labeler
2+
on:
3+
pull_request_target:
4+
types: [opened, synchronize, reopened, ready_for_review]
5+
6+
permissions:
7+
contents: read
8+
pull-requests: write
9+
10+
jobs:
11+
label:
12+
runs-on: ubuntu-latest
13+
steps:
14+
- uses: actions/labeler@v5

.github/workflows/pull.yml

Lines changed: 53 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -857,6 +857,8 @@ jobs:
857857
id-token: write
858858
contents: read
859859
strategy:
860+
matrix:
861+
model: [mv2, mv3, dl3]
860862
fail-fast: false
861863
with:
862864
runner: linux.2xlarge
@@ -868,9 +870,58 @@ jobs:
868870
# The generic Linux job chooses to use base env, not the one setup by the image
869871
CONDA_ENV=$(conda env list --json | jq -r ".envs | .[-1]")
870872
conda activate "${CONDA_ENV}"
873+
PYTHON_EXECUTABLE=python bash .ci/scripts/setup-linux.sh --build-tool cmake
874+
PYTHON_EXECUTABLE=python bash .ci/scripts/setup-qnn-deps.sh
875+
PYTHON_EXECUTABLE=python bash .ci/scripts/build-qnn-sdk.sh
876+
PYTHON_EXECUTABLE=python bash .ci/scripts/test_model.sh ${{ matrix.model }} "cmake" "qnn"
877+
878+
test-qnn-testsuite-linux:
879+
name: test-qnn-testsuite-linux
880+
permissions:
881+
id-token: write
882+
contents: read
883+
uses: ./.github/workflows/_test_backend.yml
884+
with:
885+
backend: qnn
886+
flows: '["qnn"]'
887+
ref: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.sha || github.sha }}
888+
timeout: 120
889+
run-linux: true
890+
runner-linux: linux.2xlarge
891+
892+
test-qnn-passes-linux:
893+
name: test-qnn-passes-linux
894+
uses: pytorch/test-infra/.github/workflows/linux_job_v2.yml@main
895+
permissions:
896+
id-token: write
897+
contents: read
898+
strategy:
899+
fail-fast: false
900+
with:
901+
runner: linux.2xlarge
902+
docker-image: ci-image:executorch-ubuntu-22.04-qnn-sdk
903+
submodules: 'recursive'
904+
ref: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.sha || github.sha }}
905+
timeout: 30
906+
script: |
907+
# The generic Linux job chooses to use base env, not the one setup by the image
908+
CONDA_ENV=$(conda env list --json | jq -r ".envs | .[-1]")
909+
conda activate "${CONDA_ENV}"
910+
911+
PYTHON_EXECUTABLE=python bash .ci/scripts/setup-qnn-deps.sh
912+
# Source (not bash) so QNN_SDK_ROOT stays in the environment
913+
PYTHON_EXECUTABLE=python source .ci/scripts/build-qnn-sdk.sh
914+
915+
# Editable install so the PyQnnManagerAdaptor .so built by build-qnn-sdk.sh
916+
# is visible in the source tree (the _passes import chain pulls it in transitively)
917+
CMAKE_ARGS="-DEXECUTORCH_BUILD_QNN=ON -DQNN_SDK_ROOT=$QNN_SDK_ROOT -DEXECUTORCH_BUILD_EXTENSION_TENSOR=ON" \
918+
PYTHON_EXECUTABLE=python bash .ci/scripts/setup-linux.sh --build-tool cmake --editable true
919+
920+
# test_mha_to_sha imports oss_scripts/llama which transitively needs torchtune
921+
pip install -r requirements-examples.txt
871922
872-
# placeholder for running test_qnn_delegate.py, can use matrix such that we can trigger different jobs, refers to test-llama-runner-qnn-linux
873-
# reminder: make sure each job runs fast
923+
# Run QNN pass unit tests
924+
pytest -xvs backends/qualcomm/tests/test_passes.py
874925
875926
test-phi-3-mini-runner-linux:
876927
name: test-phi-3-mini-runner-linux

.lintrunner.toml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -225,6 +225,7 @@ exclude_patterns = [
225225
'extension/llm/tokenizers/**',
226226
'backends/cadence/utils/FACTO',
227227
'examples/cuda',
228+
'examples/qualcomm',
228229
'kernels/portable',
229230
# File contains @generated
230231
'extension/llm/custom_ops/spinquant/fast_hadamard_transform_special.h',

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -204,7 +204,7 @@ ExecuTorch powers on-device AI at scale across Meta's family of apps, VR/AR devi
204204

205205
**Multimodal:** [Llava](examples/models/llava/README.md) (vision-language), [Voxtral](examples/models/voxtral/README.md) (audio-language), [Gemma](examples/models/gemma3) (vision-language)
206206

207-
**Vision/Speech:** [MobileNetV2](https://github.com/meta-pytorch/executorch-examples/tree/main/mv2), [DeepLabV3](https://github.com/meta-pytorch/executorch-examples/tree/main/dl3), [Whisper](examples/models/whisper/README.md) <!-- @lint-ignore -->
207+
**Vision/Speech:** [MobileNetV2](https://github.com/meta-pytorch/executorch-examples/tree/main/mv2), [DeepLabV3](https://github.com/meta-pytorch/executorch-examples/tree/main/dl3), [YOLO26](examples/models/yolo26/README.md), [Whisper](examples/models/whisper/README.md) <!-- @lint-ignore -->
208208

209209
**Resources:** [`examples/`](examples/) directory • [executorch-examples](https://github.com/meta-pytorch/executorch-examples) out-of-tree demos • [Optimum-ExecuTorch](https://github.com/huggingface/optimum-executorch) for HuggingFace models • [Unsloth](https://docs.unsloth.ai/new/deploy-llms-phone) for fine-tuned LLM deployment <!-- @lint-ignore -->
210210

backends/cadence/aot/compiler_funcs.py

Lines changed: 13 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,8 @@
88

99
import logging
1010
import operator
11-
from typing import Any, Optional, Union
11+
from collections.abc import Mapping, Sequence
12+
from typing import Any, cast, Optional, Union
1213

1314
import torch
1415
from torch._inductor.decomposition import remove_decompositions
@@ -301,23 +302,27 @@ def __init__(
301302
"Warning: Using pre-quantized inputs. This should only be done when calibration has been confirmed."
302303
"Incorrect quantization parameters can lead to significant accuracy degradation."
303304
)
304-
if isinstance(input_args, list):
305-
self.quant_args = extract_input_quant_params_from_graph(module, input_args)
306-
elif isinstance(input_args, dict):
305+
if isinstance(input_args, Sequence) and not isinstance(
306+
input_args, (str, bytes)
307+
):
308+
self.quant_args = extract_input_quant_params_from_graph(
309+
module, list(input_args)
310+
)
311+
elif isinstance(input_args, Mapping):
307312
# dict[int, QuantArgs] — use directly
308313
# dict[int, list[str]] — extract quant params from graph, keyed by input index
309314
first_value = next(iter(input_args.values()), None)
310315
if (
311-
isinstance(first_value, (list, tuple))
316+
isinstance(first_value, (list, tuple, Sequence))
317+
and not isinstance(first_value, (str, bytes))
312318
and first_value
313319
and isinstance(first_value[0], str)
314320
):
315321
# Values are lists of node names: extract quant params and map
316322
# to the caller-specified input indices.
317323
for input_idx, node_names in input_args.items():
318-
assert isinstance(node_names, list)
319324
extracted = extract_input_quant_params_from_graph(
320-
module, node_names
325+
module, list(cast(Sequence[str], node_names))
321326
)
322327
# Use the first extracted quant params for this input index.
323328
if extracted:
@@ -430,6 +435,7 @@ def _get_transparent_ops() -> set[Any]:
430435
torch.ops.aten.view.default,
431436
torch.ops.aten.reshape.default,
432437
torch.ops.aten.split.Tensor,
438+
torch.ops.aten.chunk.default,
433439
torch.ops.aten.slice_copy.Tensor,
434440
torch.ops.aten.permute_copy.default,
435441
torch.ops.aten.permute.default,

0 commit comments

Comments
 (0)