Commit 3383c30

Merge branch 'main' into vgf_spec_bug

2 parents: ca004e4 + f8b4835

138 files changed: +4658 −510 lines

.ci/scripts/build-mediatek-sdk.sh

Lines changed: 1 addition & 1 deletion
@@ -14,9 +14,9 @@ build_neuron_backend() {
   export NEURON_BUFFER_ALLOCATOR_LIB=${MEDIATEK_SDK_ROOT}/libneuron_buffer_allocator.so
   export EXECUTORCH_ROOT="$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")/../.." && pwd)"
 
-
   cd ${EXECUTORCH_ROOT}
   ./backends/mediatek/scripts/mtk_build.sh
+  ./examples/mediatek/mtk_build_examples.sh
 }
 
 build_neuron_backend
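
For context, a minimal sketch of invoking this script locally. Only this hunk is visible, so the assumption is that MEDIATEK_SDK_ROOT must be supplied by the caller; the path below is a placeholder, and the script derives NEURON_BUFFER_ALLOCATOR_LIB and EXECUTORCH_ROOT itself before building the backend and, with this change, the examples.

# Hedged usage sketch; MEDIATEK_SDK_ROOT is a placeholder path, not from this diff.
export MEDIATEK_SDK_ROOT=/opt/mediatek-sdk
bash .ci/scripts/build-mediatek-sdk.sh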

.ci/scripts/test_llama_lora.sh

Lines changed: 96 additions & 0 deletions
@@ -0,0 +1,96 @@
+#!/bin/bash
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+set -exu
+# shellcheck source=/dev/null
+source "$(dirname "${BASH_SOURCE[0]}")/utils.sh"
+
+cmake_install_executorch_libraries() {
+  echo "Installing libexecutorch.a, libextension_module.so, libportable_ops_lib.a"
+  rm -rf cmake-out
+  retry cmake --preset llm \
+    -DCMAKE_INSTALL_PREFIX=cmake-out \
+    -DCMAKE_BUILD_TYPE=Release
+  cmake --build cmake-out -j9 --target install --config Release
+}
+
+cmake_build_llama_runner() {
+  echo "Building llama runner"
+  pushd extension/llm/tokenizers
+  echo "Updating tokenizers submodule"
+  git submodule update --init
+  popd
+  dir="examples/models/llama"
+  retry cmake \
+    -DBUILD_TESTING=OFF \
+    -DCMAKE_INSTALL_PREFIX=cmake-out \
+    -DCMAKE_BUILD_TYPE=Release \
+    -Bcmake-out/${dir} \
+    ${dir}
+  cmake --build cmake-out/${dir} -j9 --config Release
+}
+
+cleanup_files() {
+  echo "Deleting downloaded and generated files"
+  rm -rf "${DOWNLOADED_PATH}/"
+  rm result.txt
+}
+
+# Download model artifacts from HF Hub.
+# Hosting in personal repo for now.
+HF_MODEL_REPO="lucylq/llama3_1B_lora"
+DOWNLOADED_PATH=$(
+  bash "$(dirname "${BASH_SOURCE[0]}")/download_hf_hub.sh" \
+    --model_id "${HF_MODEL_REPO}" \
+    --files "adapter_config.json" "adapter_model.pt" "consolidated.00.pth" "params.json" "tokenizer.model"
+)
+EXPORTED_MODEL_NAME="llama_3_2_1B_lora.pte"
+# Export model.
+$PYTHON_EXECUTABLE -m extension.llm.export.export_llm \
+  base.checkpoint="${DOWNLOADED_PATH}/consolidated.00.pth" \
+  base.params="${DOWNLOADED_PATH}/params.json" \
+  base.adapter_checkpoint="${DOWNLOADED_PATH}/adapter_model.pt" \
+  base.adapter_config="${DOWNLOADED_PATH}/adapter_config.json" \
+  base.tokenizer_path="${DOWNLOADED_PATH}/tokenizer.model" \
+  model.use_kv_cache=true \
+  model.use_sdpa_with_kv_cache=true \
+  model.dtype_override="fp32" \
+  backend.xnnpack.enabled=true \
+  backend.xnnpack.extended_ops=true \
+  export.output_name="${EXPORTED_MODEL_NAME}"
+
+# Build llama runner.
+cmake_install_executorch_libraries
+cmake_build_llama_runner
+
+PROMPT="What happens if you eat watermelon seeds?"
+# Run llama runner
+RUNTIME_ARGS="--model_path=${EXPORTED_MODEL_NAME} --tokenizer_path=${DOWNLOADED_PATH}/tokenizer.model --temperature=0 --seq_len=20 --warmup=1"
+
+NOW=$(date +"%H:%M:%S")
+echo "Starting to run llama runner at ${NOW}"
+# shellcheck source=/dev/null
+cmake-out/examples/models/llama/llama_main --prompt="${PROMPT}" ${RUNTIME_ARGS} > result.txt
+NOW=$(date +"%H:%M:%S")
+echo "Finished at ${NOW}"
+
+RESULT=$(cat result.txt)
+EXPECTED_PREFIX="What happens if you eat watermelon seeds? Watermelon seeds are a good source of vitamin C,"
+
+if [[ "${RESULT}" == "${EXPECTED_PREFIX}"* ]]; then
+  echo "Expected result prefix: ${EXPECTED_PREFIX}"
+  echo "Actual result: ${RESULT}"
+  echo "Success"
+  cleanup_files
+else
+  echo "Expected result prefix: ${EXPECTED_PREFIX}"
+  echo "Actual result: ${RESULT}"
+  echo "Failure; results not the same"
+
+  cleanup_files
+  exit 1
+fi
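
The workflow job added below in .github/workflows/pull.yml drives this script in CI. As a hedged sketch, an equivalent local run, assuming an executorch checkout with submodules synced and the same setup steps as the job:

# Local run mirroring the CI job; the setup script, requirements script, and
# torchtune nightly pin are all taken from the workflow diff below.
bash .ci/scripts/setup-linux.sh --build-tool "cmake"
bash examples/models/llama/install_requirements.sh
python -m pip install torchtune==0.7.0.dev20250730 \
    --extra-index-url https://download.pytorch.org/whl/nightly/cpu
PYTHON_EXECUTABLE=python bash .ci/scripts/test_llama_lora.sh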

.github/workflows/pull.yml

Lines changed: 30 additions & 0 deletions
@@ -687,6 +687,36 @@ jobs:
       # run llama runner in eager mode
       PYTHON_EXECUTABLE=python bash .ci/scripts/test_llama_runner_eager.sh
 
+  test-llama-lora-linux:
+    name: test-llama-lora-linux
+    uses: pytorch/test-infra/.github/workflows/linux_job_v2.yml@main
+    permissions:
+      id-token: write
+      contents: read
+    strategy:
+      fail-fast: false
+    with:
+      runner: linux.24xlarge
+      docker-image: ci-image:executorch-ubuntu-22.04-clang12
+      submodules: 'recursive'
+      ref: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.sha || github.sha }}
+      timeout: 90
+      script: |
+        # The generic Linux job chooses to use base env, not the one setup by the image
+        CONDA_ENV=$(conda env list --json | jq -r ".envs | .[-1]")
+        conda activate "${CONDA_ENV}"
+
+        PYTHON_EXECUTABLE=python bash .ci/scripts/setup-linux.sh --build-tool "cmake"
+
+        # Install llama requirements
+        bash examples/models/llama/install_requirements.sh
+
+        # Install a recent torchtune nightly
+        PYTHON_EXECUTABLE=python python -m pip install torchtune==0.7.0.dev20250730 --extra-index-url https://download.pytorch.org/whl/nightly/cpu
+
+        # Export the LoRA model and run it with the llama runner
+        PYTHON_EXECUTABLE=python bash .ci/scripts/test_llama_lora.sh
+
   test-mediatek-models-linux:
     name: test-mediatek-models-linux
     uses: pytorch/test-infra/.github/workflows/linux_job_v2.yml@main

CMakeLists.txt

Lines changed: 1 addition & 1 deletion
@@ -849,7 +849,7 @@ if(NOT EXECUTORCH_SELECT_OPS_YAML STREQUAL ""
     LIB_NAME
     "executorch_selected_kernels"
    OPS_SCHEMA_YAML
-    "${EXECUTORCH_SELECT_OPS_LIB}"
+    "${EXECUTORCH_SELECT_OPS_YAML}"
     ROOT_OPS
     "${EXECUTORCH_SELECT_OPS_LIST}"
     INCLUDE_ALL_OPS
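
The fix: the OPS_SCHEMA_YAML argument was being populated from EXECUTORCH_SELECT_OPS_LIB rather than EXECUTORCH_SELECT_OPS_YAML, the variable the enclosing if() actually tests. A hedged sketch of a configure line exercising the corrected path, assuming this is an ordinary CMake cache variable (the value is a placeholder, not from this diff):

# Hypothetical configure invocation; only the variable name comes from the hunk.
cmake -S . -B cmake-out \
    -DEXECUTORCH_SELECT_OPS_YAML=/path/to/selected_ops.yaml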

backends/arm/test/ops/test_abs.py

Lines changed: 23 additions & 0 deletions
@@ -15,6 +15,7 @@
     EthosU85PipelineINT,
     TosaPipelineFP,
     TosaPipelineINT,
+    VgfPipeline,
 )
 
 aten_op = "torch.ops.aten.abs.default"
@@ -66,3 +67,25 @@ def test_abs_u85_INT(test_data: torch.Tensor):
         Abs(), test_data(), aten_op, exir_op, run_on_fvp=True
     )
     pipeline.run()
+
+
+@common.parametrize("test_data", Abs.test_parameters)
+@common.SkipIfNoModelConverter
+def test_abs_vgf_FP(test_data: input_t1):
+    pipeline = VgfPipeline[input_t1](
+        Abs(), test_data(), aten_op, exir_op, tosa_version="TOSA-1.0+FP"
+    )
+    pipeline.run()
+
+
+@common.parametrize("test_data", Abs.test_parameters)
+@common.SkipIfNoModelConverter
+def test_abs_vgf_INT(test_data: input_t1):
+    pipeline = VgfPipeline[input_t1](
+        Abs(),
+        test_data(),
+        aten_op,
+        exir_op,
+        tosa_version="TOSA-1.0+INT",
+    )
+    pipeline.run()
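
Each Arm op-test file in this commit gains the same pair of VGF variants, FP and INT, differing only in tosa_version and gated by @common.SkipIfNoModelConverter. Assuming the suite's usual pytest entry point, the new variants for one file can be selected by name:

# Assumed invocation: these are pytest-style tests, so -k filters the new
# variants; they self-skip when no VGF model converter is available.
pytest backends/arm/test/ops/test_abs.py -k vgf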

backends/arm/test/ops/test_acosh.py

Lines changed: 25 additions & 0 deletions
@@ -14,6 +14,7 @@
     EthosU85PipelineINT,
     TosaPipelineFP,
     TosaPipelineINT,
+    VgfPipeline,
 )
 
 input_t = Tuple[torch.Tensor]  # Input x
@@ -112,3 +113,27 @@ def test_acosh_u85_INT_xfail(test_data: Tuple):
         run_on_fvp=False,
     )
     pipeline.run()
+
+
+@common.parametrize("test_data", test_data_suite)
+@common.SkipIfNoModelConverter
+def test_acosh_vgf_FP(test_data: Tuple):
+    pipeline = VgfPipeline[input_t](
+        Acosh(),
+        (test_data(),),
+        aten_op,
+        tosa_version="TOSA-1.0+FP",
+    )
+    pipeline.run()
+
+
+@common.parametrize("test_data", test_data_suite)
+@common.SkipIfNoModelConverter
+def test_acosh_vgf_INT(test_data: Tuple):
+    pipeline = VgfPipeline[input_t](
+        Acosh(),
+        (test_data(),),
+        aten_op,
+        tosa_version="TOSA-1.0+INT",
+    )
+    pipeline.run()

backends/arm/test/ops/test_adaptive_avg_pool2d.py

Lines changed: 29 additions & 0 deletions
@@ -14,6 +14,7 @@
     EthosU85PipelineINT,
     TosaPipelineFP,
     TosaPipelineINT,
+    VgfPipeline,
 )
 
 exir_op = "executorch_exir_dialects_edge__ops_aten_avg_pool2d_default"
@@ -161,3 +162,31 @@ def test_adaptive_avg_pool2d_u85_INT(test_module):
         exir_ops=exir_op,
     )
     pipeline.run()
+
+
+@common.parametrize("test_module", test_modules)
+@common.SkipIfNoModelConverter
+def test_adaptive_avg_pool2d_vgf_FP(test_module):
+    model, input_tensor = test_module()
+    pipeline = VgfPipeline[input_t](
+        model,
+        input_tensor,
+        [],
+        exir_op,
+        tosa_version="TOSA-1.0+FP",
+    )
+    pipeline.run()
+
+
+@common.parametrize("test_module", test_modules)
+@common.SkipIfNoModelConverter
+def test_adaptive_avg_pool2d_vgf_INT(test_module):
+    model, input_tensor = test_module()
+    pipeline = VgfPipeline[input_t](
+        model,
+        input_tensor,
+        [],
+        exir_op,
+        tosa_version="TOSA-1.0+INT",
+    )
+    pipeline.run()

backends/arm/test/ops/test_addmm.py

Lines changed: 27 additions & 0 deletions
@@ -13,6 +13,7 @@
     EthosU85PipelineINT,
     TosaPipelineFP,
     TosaPipelineINT,
+    VgfPipeline,
 )
 
 aten_op = "torch.ops.aten.addmm.default"
@@ -155,3 +156,29 @@ def test_addmm_u85_INT(test_data: Tuple):
         exir_ops=exir_op,
     )
     pipeline.run()
+
+
+@common.parametrize("test_data", test_data_suite)
+@common.SkipIfNoModelConverter
+def test_addmm_vgf_FP(test_data: input_t1):
+    pipeline = VgfPipeline[input_t1](
+        Addmm(),
+        (*test_data,),
+        aten_op=aten_op,
+        exir_op=exir_op,
+        tosa_version="TOSA-1.0+FP",
+    )
+    pipeline.run()
+
+
+@common.parametrize("test_data", test_data_suite)
+@common.SkipIfNoModelConverter
+def test_addmm_vgf_INT(test_data: input_t1):
+    pipeline = VgfPipeline[input_t1](
+        Addmm(),
+        (*test_data,),
+        aten_op=[],
+        exir_op=exir_op,
+        tosa_version="TOSA-1.0+INT",
+    )
+    pipeline.run()

backends/arm/test/ops/test_alias_copy.py

Lines changed: 27 additions & 0 deletions
@@ -12,6 +12,7 @@
     EthosU85PipelineINT,
     TosaPipelineFP,
     TosaPipelineINT,
+    VgfPipeline,
 )
 
 input_t1 = Tuple[torch.Tensor]
@@ -83,3 +84,29 @@ def test_alias_u85_INT(test_data: input_t1):
         AliasCopy.aten_op,
         AliasCopy.exir_op,
     ).run()
+
+
+@common.parametrize("test_data", AliasCopy.test_data)
+@common.SkipIfNoModelConverter
+def test_alias_vgf_FP(test_data: input_t1):
+    pipeline = VgfPipeline[input_t1](
+        AliasCopy(),
+        test_data(),
+        AliasCopy.aten_op,
+        AliasCopy.exir_op,
+        tosa_version="TOSA-1.0+FP",
+    )
+    pipeline.run()
+
+
+@common.parametrize("test_data", AliasCopy.test_data)
+@common.SkipIfNoModelConverter
+def test_alias_vgf_INT(test_data: input_t1):
+    pipeline = VgfPipeline[input_t1](
+        AliasCopy(),
+        test_data(),
+        AliasCopy.aten_op,
+        AliasCopy.exir_op,
+        tosa_version="TOSA-1.0+INT",
+    )
+    pipeline.run()
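
The same pytest assumption extends to exercising every new VGF variant in the op-test directory at once:

# Assumed invocation, as above; selects all tests whose names contain "vgf".
pytest backends/arm/test/ops -k vgf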
