pytorch
diff --git a/‎.ci/scripts/setup-samsung-linux-deps.sh‎
Lines changed: 0 additions & 9 deletions b/‎.ci/scripts/setup-samsung-linux-deps.sh‎
Lines changed: 0 additions & 9 deletions
diff --git a/‎.ci/scripts/test_model.ps1‎
Lines changed: 1 addition & 1 deletion b/‎.ci/scripts/test_model.ps1‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.ci/scripts/wheel/pre_build_script.sh‎
Lines changed: 18 additions & 1 deletion b/‎.ci/scripts/wheel/pre_build_script.sh‎
Lines changed: 18 additions & 1 deletion
diff --git a/‎.ci/scripts/wheel/test_windows.py‎
Lines changed: 75 additions & 0 deletions b/‎.ci/scripts/wheel/test_windows.py‎
Lines changed: 75 additions & 0 deletions
diff --git a/‎.ci/scripts/wheel/vc_env_helper.bat‎
Lines changed: 61 additions & 0 deletions b/‎.ci/scripts/wheel/vc_env_helper.bat‎
Lines changed: 61 additions & 0 deletions
diff --git a/‎.github/workflows/build-wheels-windows.yml‎
Lines changed: 59 additions & 0 deletions b/‎.github/workflows/build-wheels-windows.yml‎
Lines changed: 59 additions & 0 deletions
diff --git a/‎.github/workflows/pull.yml‎
Lines changed: 9 additions & 2 deletions b/‎.github/workflows/pull.yml‎
Lines changed: 9 additions & 2 deletions
diff --git a/‎.github/workflows/trunk.yml‎
Lines changed: 3 additions & 0 deletions b/‎.github/workflows/trunk.yml‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎backends/apple/coreml/recipes/coreml_recipe_provider.py‎
Lines changed: 5 additions & 2 deletions b/‎backends/apple/coreml/recipes/coreml_recipe_provider.py‎
Lines changed: 5 additions & 2 deletions
diff --git a/‎backends/apple/coreml/test/test_coreml_quantizer.py‎
Lines changed: 2 additions & 4 deletions b/‎backends/apple/coreml/test/test_coreml_quantizer.py‎
Lines changed: 2 additions & 4 deletions
@@ -54,15 +54,6 @@ install_enn_backend() {
   rm -rf "${NDK_INSTALLATION_DIR}" && sudo mkdir -p "${NDK_INSTALLATION_DIR}"
   ANDROID_NDK_VERSION=r27b
 
-  pushd .
-  cd /tmp
-  curl -Os --retry 3 "https://ossci-android.s3.amazonaws.com/android-ndk-${ANDROID_NDK_VERSION}-linux.zip"
-  unzip -qo "android-ndk-${ANDROID_NDK_VERSION}-linux.zip"
-
-  # Print the content for manual verification
-  ls -lah "android-ndk-${ANDROID_NDK_VERSION}"
-  sudo mv "android-ndk-${ANDROID_NDK_VERSION}"/* "${NDK_INSTALLATION_DIR}"
-  popd
   # build Exynos backend
   export ANDROID_NDK_ROOT=${ANDROID_NDK_ROOT:-/opt/ndk}
   bash backends/samsung/build.sh --build all
 
@@ -34,7 +34,7 @@ function ExportModel-Xnnpack {
         [bool]$quantize
     )
 
-    if $(quantize) {
+    if ($quantize) {
         python -m examples.xnnpack.aot_compiler --model_name="${MODEL_NAME}" --delegate --quantize | Write-Host
         $modelFile = "$($modelName)_xnnpack_q8.pte"
     } else {
 
@@ -9,9 +9,26 @@ set -euxo pipefail
 
 # This script is run before building ExecuTorch binaries
 
+# Clone nested submodules for tokenizers - this is a workaround for recursive
+# submodule clone failing due to path length limitations on Windows. Eventually,
+# we should update the core job in test-infra to enable long paths before
+# checkout to avoid needing to do this.
+pushd extension/llm/tokenizers
+git submodule update --init
+popd
+
+# On Windows, enable symlinks and re-checkout the current revision to create
+# the symlinked src/ directory. This is needed to build the wheel.
+UNAME_S=$(uname -s)
+if [[ $UNAME_S == *"MINGW"* || $UNAME_S == *"MSYS"* ]]; then
+    echo "Enabling symlinks on Windows"
+    git config core.symlinks true
+    git checkout -f HEAD
+fi
+
 # Manually install build requirements because `python setup.py bdist_wheel` does
 # not install them. TODO(dbort): Switch to using `python -m build --wheel`,
 # which does install them. Though we'd need to disable build isolation to be
 # able to see the installed torch package.
 
-"${GITHUB_WORKSPACE}/${REPOSITORY}/install_requirements.sh"  --example
+"${GITHUB_WORKSPACE}/${REPOSITORY}/install_requirements.sh" --example
@@ -0,0 +1,75 @@
+#!/usr/bin/env python
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+from typing import List
+
+import torch
+from executorch.backends.xnnpack.partition.xnnpack_partitioner import XnnpackPartitioner
+from executorch.examples.models import Backend, Model, MODEL_NAME_TO_MODEL
+from executorch.examples.models.model_factory import EagerModelFactory
+from executorch.examples.xnnpack import MODEL_NAME_TO_OPTIONS
+from executorch.examples.xnnpack.quantization.utils import quantize as quantize_xnn
+from executorch.exir import EdgeCompileConfig, to_edge_transform_and_lower
+from executorch.extension.pybindings.portable_lib import (
+    _load_for_executorch_from_buffer,
+)
+from test_base import ModelTest
+
+
+def test_model_xnnpack(model: Model, quantize: bool) -> None:
+    model_instance, example_inputs, _, _ = EagerModelFactory.create_model(
+        *MODEL_NAME_TO_MODEL[str(model)]
+    )
+
+    model_instance.eval()
+    ref_outputs = model_instance(*example_inputs)
+
+    if quantize:
+        quant_type = MODEL_NAME_TO_OPTIONS[str(model)].quantization
+        model_instance = torch.export.export_for_training(
+            model_instance, example_inputs
+        )
+        model_instance = quantize_xnn(
+            model_instance.module(), example_inputs, quant_type
+        )
+
+    lowered = to_edge_transform_and_lower(
+        torch.export.export(model_instance, example_inputs),
+        partitioner=[XnnpackPartitioner()],
+        compile_config=EdgeCompileConfig(
+            _check_ir_validity=False,
+        ),
+    ).to_executorch()
+
+    loaded_model = _load_for_executorch_from_buffer(lowered.buffer)
+    et_outputs = loaded_model([*example_inputs])
+
+    if isinstance(ref_outputs, torch.Tensor):
+        ref_outputs = (ref_outputs,)
+
+    assert len(ref_outputs) == len(et_outputs)
+    for i in range(len(ref_outputs)):
+        torch.testing.assert_close(ref_outputs[i], et_outputs[i], atol=1e-4, rtol=1e-5)
+
+
+def run_tests(model_tests: List[ModelTest]) -> None:
+    for model_test in model_tests:
+        if model_test.backend == Backend.Xnnpack:
+            test_model_xnnpack(model_test.model, quantize=False)
+        else:
+            raise RuntimeError(f"Unsupported backend {model_test.backend}.")
+
+
+if __name__ == "__main__":
+    run_tests(
+        model_tests=[
+            ModelTest(
+                model=Model.Mv3,
+                backend=Backend.Xnnpack,
+            ),
+        ]
+    )
@@ -0,0 +1,61 @@
+REM This is lightly modified from the torchvision Windows build logic.
+REM See https://github.com/pytorch/vision/blob/main/packaging/windows/internal/vc_env_helper.bat
+
+@echo on
+
+set VC_VERSION_LOWER=17
+set VC_VERSION_UPPER=18
+
+for /f "usebackq tokens=*" %%i in (`"%ProgramFiles(x86)%\Microsoft Visual Studio\Installer\vswhere.exe" -legacy -products * -version [%VC_VERSION_LOWER%^,%VC_VERSION_UPPER%^) -property installationPath`) do (
+    if exist "%%i" if exist "%%i\VC\Auxiliary\Build\vcvarsall.bat" (
+        set "VS15INSTALLDIR=%%i"
+        set "VS15VCVARSALL=%%i\VC\Auxiliary\Build\vcvarsall.bat"
+        goto vswhere
+    )
+)
+
+:vswhere
+if "%VSDEVCMD_ARGS%" == "" (
+    call "%VS15VCVARSALL%" x64 || exit /b 1
+) else (
+    call "%VS15VCVARSALL%" x64 %VSDEVCMD_ARGS% || exit /b 1
+)
+
+@echo on
+
+if "%CU_VERSION%" == "xpu" call "C:\Program Files (x86)\Intel\oneAPI\setvars.bat"
+
+set DISTUTILS_USE_SDK=1
+
+set args=%1
+shift
+:start
+if [%1] == [] goto done
+set args=%args% %1
+shift
+goto start
+
+:done
+if "%args%" == "" (
+    echo Usage: vc_env_helper.bat [command] [args]
+    echo e.g. vc_env_helper.bat cl /c test.cpp
+)
+
+set work_dir=%CD%
+if exist setup.py (
+    echo "Creating symlink..."
+    REM Setup a symlink to shorten the path length.
+    REM Note that the ET directory has to be named "executorch".
+    cd %GITHUB_WORKSPACE%
+    if not exist et\ (
+        mkdir et
+    )
+    cd et
+    echo Work dir: %work_dir%
+    if not exist executorch\ (
+        mklink /d executorch %work_dir%
+    )
+    cd executorch
+)
+
+%args% || exit /b 1
@@ -0,0 +1,59 @@
+name: Build Windows Wheels
+
+on:
+  pull_request:
+  push:
+    branches:
+      - nightly
+      - main
+      - release/*
+    tags:
+        # NOTE: Binary build pipelines should only get triggered on release candidate builds
+        # Release candidate tags look like: v1.11.0-rc1
+        - v[0-9]+.[0-9]+.[0-9]+-rc[0-9]+
+  workflow_dispatch:
+
+permissions:
+  id-token: write
+  contents: read
+
+jobs:
+  generate-matrix:
+    uses: pytorch/test-infra/.github/workflows/generate_binary_build_matrix.yml@main
+    with:
+      package-type: wheel
+      os: windows
+      test-infra-repository: pytorch/test-infra
+      test-infra-ref: main
+      with-cuda: disabled
+      with-rocm: disabled
+      python-versions: '["3.10", "3.11", "3.12"]'
+
+  build:
+    needs: generate-matrix
+    strategy:
+      fail-fast: false
+      matrix:
+        include:
+          - repository: pytorch/executorch
+            pre-script: .ci\\scripts\\wheel\\pre_build_script.sh
+            env-script: .ci\\scripts\\wheel\\vc_env_helper.bat
+            post-script: .ci\\scripts\\wheel\\post_build_script.sh
+            smoke-test-script: .ci/scripts/wheel/test_windows.py
+            package-name: executorch
+    name: ${{ matrix.repository }}
+    uses: pytorch/test-infra/.github/workflows/build_wheels_windows.yml@main
+    with:
+      repository: ${{ matrix.repository }}
+      ref: ""
+      test-infra-repository: pytorch/test-infra
+      test-infra-ref: main
+      build-matrix: ${{ needs.generate-matrix.outputs.matrix }}
+      pre-script: ${{ matrix.pre-script }}
+      env-script: ${{ matrix.env-script }}
+      post-script: ${{ matrix.post-script }}
+      package-name: ${{ matrix.package-name }}
+      smoke-test-script: ${{ matrix.smoke-test-script }}
+      trigger-event: ${{ github.event_name }}
+      wheel-build-params: "--verbose"
+      submodules: true
@@ -874,7 +874,7 @@ jobs:
       contents: read
     with:
       runner: linux.2xlarge
-      docker-image: ci-image:executorch-ubuntu-22.04-gcc9
+      docker-image: ci-image:executorch-ubuntu-22.04-clang12-android
       submodules: 'recursive'
       ref: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.sha || github.sha }}
       timeout: 90
@@ -892,7 +892,7 @@ jobs:
         source .ci/scripts/setup-samsung-linux-deps.sh
 
         # Test models serially
-        models="mv2 ic3 resnet18 resnet50"
+        models="mv2 ic3 resnet18 resnet50 mv3 ic4 dl3 edsr vit w2l"
         for model in $models; do
           python -m executorch.examples.samsung.aot_compiler --model_name=$model -c E9955
         done
@@ -971,6 +971,13 @@ jobs:
         ./cmake-out/backends/vulkan/test/custom_ops/q4gsw_linear
         ./cmake-out/backends/vulkan/test/custom_ops/choose_qparams_per_row
 
+        # "Classic" Operator tests
+        PYTHON_EXECUTABLE=python bash backends/vulkan/test/scripts/test_op.sh --build
+        # TODO(ssjia): figure out how to run custom op tests in CI. Currently, they are
+        # failing due to to the libstdc++.so.6 installed with conda not supporting
+        # GLIBCXX_3.4.30. These tests are still run in Meta internal CI.
+        # ./cmake-out/backends/vulkan/test/op_tests/vulkan_sdpa_test
+
         # Run e2e testing for selected operators. More operators will be tested via this
         # route in the future.
         python -m unittest backends/vulkan/test/test_vulkan_delegate.py -k "*pt2e*"
 
@@ -8,6 +8,9 @@ on:
     tags:
       - ciflow/trunk/*
   pull_request:
+    paths:
+      - .ci/docker/ci_commit_pins/pytorch.txt
+      - .ci/scripts/**
   workflow_dispatch:
 
 concurrency:
 
@@ -69,6 +69,7 @@ def create_recipe(
                 recipe_type, activation_dtype=torch.float32, **kwargs
             )
         elif recipe_type == CoreMLRecipeType.TORCHAO_INT4_WEIGHT_ONLY_PER_CHANNEL:
+            self._validate_and_set_deployment_target(kwargs, ct.target.iOS18, "torchao")
             return self._build_torchao_quantized_recipe(
                 recipe_type,
                 weight_dtype=torch.int4,
@@ -77,6 +78,7 @@ def create_recipe(
             )
         elif recipe_type == CoreMLRecipeType.TORCHAO_INT4_WEIGHT_ONLY_PER_GROUP:
             group_size = kwargs.pop("group_size", 32)
+            self._validate_and_set_deployment_target(kwargs, ct.target.iOS18, "torchao")
             return self._build_torchao_quantized_recipe(
                 recipe_type,
                 weight_dtype=torch.int4,
@@ -85,11 +87,14 @@ def create_recipe(
                 **kwargs,
             )
         elif recipe_type == CoreMLRecipeType.TORCHAO_INT8_WEIGHT_ONLY_PER_CHANNEL:
+            self._validate_and_set_deployment_target(kwargs, ct.target.iOS16, "torchao")
             return self._build_torchao_quantized_recipe(
                 recipe_type, weight_dtype=torch.int8, is_per_channel=True, **kwargs
             )
         elif recipe_type == CoreMLRecipeType.TORCHAO_INT8_WEIGHT_ONLY_PER_GROUP:
             group_size = kwargs.pop("group_size", 32)
+            # override minimum_deployment_target to ios18 for torchao (GH issue #13122)
+            self._validate_and_set_deployment_target(kwargs, ct.target.iOS18, "torchao")
             return self._build_torchao_quantized_recipe(
                 recipe_type,
                 weight_dtype=torch.int8,
@@ -312,8 +317,6 @@ def _build_torchao_quantized_recipe(
             ao_quantization_configs=[config],
         )
 
-        # override minimum_deployment_target to ios18 for torchao (GH issue #13122)
-        self._validate_and_set_deployment_target(kwargs, ct.target.iOS18, "torchao")
         lowering_recipe = self._get_coreml_lowering_recipe(**kwargs)
 
         return ExportRecipe(
 
@@ -15,7 +15,7 @@
 )
 
 from executorch.backends.apple.coreml.quantizer import CoreMLQuantizer
-from torch.export import export_for_training
+from torch.export import export
 from torchao.quantization.pt2e.quantize_pt2e import (
     convert_pt2e,
     prepare_pt2e,
@@ -32,9 +32,7 @@ def quantize_and_compare(
     ) -> None:
         assert quantization_type in {"PTQ", "QAT"}
 
-        pre_autograd_aten_dialect = export_for_training(
-            model, example_inputs, strict=True
-        ).module()
+        pre_autograd_aten_dialect = export(model, example_inputs, strict=True).module()
 
         quantization_config = LinearQuantizerConfig.from_dict(
             {
Original file line number	Diff line number	Diff line change
`@@ -34,7 +34,7 @@ function ExportModel-Xnnpack {`
`34`	`34`	`[bool]$quantize`
`35`	`35`	`)`
`36`	`36`
`37`		`- if $(quantize) {`
	`37`	`+ if ($quantize) {`
`38`	`38`	`python -m examples.xnnpack.aot_compiler --model_name="${MODEL_NAME}" --delegate --quantize \| Write-Host`
`39`	`39`	`$modelFile = "$($modelName)_xnnpack_q8.pte"`
`40`	`40`	`} else {`