
Commit 163c6a8

update about onnx runtime's fallback behavior

1 parent: c919981

File tree

4 files changed (+38 −7 lines)

Cargo.lock

Lines changed: 1 addition & 0 deletions (generated lockfile; diff not rendered)

crates/wasi-nn/Cargo.toml

Lines changed: 2 additions & 0 deletions
```diff
@@ -72,6 +72,8 @@ onnx = ["dep:ort"]
 onnx-download = ["onnx", "ort/download-binaries"]
 # CUDA execution provider for NVIDIA GPU support (requires CUDA toolkit)
 onnx-cuda = ["onnx", "ort/cuda"]
+# Enable tracing for ONNX Runtime
+ort-tracing = ["onnx", "ort/tracing"]
 # WinML is only available on Windows 10 1809 and later.
 winml = ["dep:windows"]
 # PyTorch is available on all platforms; requires Libtorch to be installed
```

crates/wasi-nn/examples/classification-component-onnx/README.md

Lines changed: 30 additions & 2 deletions
````diff
@@ -12,7 +12,11 @@ GPU execution target only supports Nvidia CUDA (onnx-cuda) as execution provider
 
 In this directory, run the following command to build the WebAssembly component:
 ```console
+# build component for target wasm32-wasip1
 cargo component build
+
+# build component for target wasm32-wasip2
+cargo component build --target wasm32-wasip2
 ```
 
 ## Running the Example
@@ -44,7 +48,7 @@ Arguments:
 ./target/debug/wasmtime run \
 -Snn \
 --dir ./crates/wasi-nn/examples/classification-component-onnx/fixture/::fixture \
-./crates/wasi-nn/examples/classification-component-onnx/target/wasm32-wasip1/debug/classification-component-onnx.wasm
+./crates/wasi-nn/examples/classification-component-onnx/target/wasm32-wasip2/debug/classification-component-onnx.wasm
 ```
 
 #### GPU (CUDA) Execution:
@@ -55,7 +59,7 @@ export LD_LIBRARY_PATH={wasmtime_workspace}/target/debug
 ./target/debug/wasmtime run \
 -Snn \
 --dir ./crates/wasi-nn/examples/classification-component-onnx/fixture/::fixture \
-./crates/wasi-nn/examples/classification-component-onnx/target/wasm32-wasip1/debug/classification-component-onnx.wasm \
+./crates/wasi-nn/examples/classification-component-onnx/target/wasm32-wasip2/debug/classification-component-onnx.wasm \
 gpu
 
 ```
@@ -79,7 +83,31 @@ Index: n02102318 cocker spaniel, English cocker spaniel, cocker - Probability: 0
 When using GPU target, the first line will indicate the selected execution target.
 You can monitor GPU usage using cmd `watch -n 1 nvidia-smi`.
 
+To see trace logs from `wasmtime_wasi_nn` or `ort`, run Wasmtime with `WASMTIME_LOG` enabled, e.g.,
+
+```sh
+WASMTIME_LOG=wasmtime_wasi_nn=warn ./target/debug/wasmtime run ...
+WASMTIME_LOG=ort=warn ./target/debug/wasmtime run ...
+```
+
 ## Prerequisites for GPU(CUDA) Support
 - NVIDIA GPU with CUDA support
 - CUDA Toolkit 12.x with cuDNN 9.x
 - Build wasmtime with `wasmtime-wasi-nn/onnx-cuda` feature
+
+## ONNX Runtime's Fallback Behavior
+
+If the GPU execution provider is requested (by passing `gpu`) but the device does not have a GPU or the necessary CUDA drivers are missing, ONNX Runtime will **silently fall back** to the CPU execution provider. The application will continue to run, but inference will happen on the CPU.
+
+To verify whether fallback is happening, you can enable ONNX Runtime logging:
+
+1. Build Wasmtime with the additional `wasmtime-wasi-nn/ort-tracing` feature:
+```sh
+cargo build --features component-model,wasi-nn,wasmtime-wasi-nn/onnx-cuda,wasmtime-wasi-nn/ort-tracing
+```
+
+2. Run Wasmtime with `WASMTIME_LOG` enabled to see `ort` warnings:
+```sh
+WASMTIME_LOG=ort=warn ./target/debug/wasmtime run ...
+```
+You should see a warning like: `No execution providers from session options registered successfully; may fall back to CPU.`
````
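The `WASMTIME_LOG` values used above are `target=level` directives in the style of `tracing_subscriber`'s `EnvFilter`. As an illustration only (this is not Wasmtime's actual code, and real `EnvFilter` syntax supports more forms, such as bare levels and span filters), a minimal sketch of how such a directive decides which log records pass:

```rust
// Hypothetical sketch: interpret a comma-separated list of
// `target=level` directives, e.g. "ort=warn,wasmtime_wasi_nn=debug".
// A record passes if its target matches a directive and its level is
// at or above (i.e. no more verbose than) the directive's level.

fn level_rank(level: &str) -> Option<u8> {
    match level {
        "error" => Some(1),
        "warn" => Some(2),
        "info" => Some(3),
        "debug" => Some(4),
        "trace" => Some(5),
        _ => None, // unknown level: directive never matches
    }
}

/// Returns true if a record from `target` at `level` passes `filter`.
fn enabled(filter: &str, target: &str, level: &str) -> bool {
    filter.split(',').any(|directive| match directive.split_once('=') {
        Some((t, max)) => {
            let (rec, cap) = (level_rank(level), level_rank(max));
            // Module targets match by prefix, like tracing targets do.
            target.starts_with(t) && rec.is_some() && rec <= cap
        }
        None => false,
    })
}

fn main() {
    let filter = "ort=warn,wasmtime_wasi_nn=debug";
    assert!(enabled(filter, "ort", "warn"));
    assert!(enabled(filter, "ort", "error"));
    assert!(!enabled(filter, "ort", "info")); // info is more verbose than warn
    assert!(enabled(filter, "wasmtime_wasi_nn", "debug"));
    println!("filter directives behave as expected");
}
```

So `WASMTIME_LOG=ort=warn` surfaces only `warn` and `error` records from `ort`, which is exactly the level the fallback warning is emitted at.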

crates/wasi-nn/src/backend/onnx.rs

Lines changed: 5 additions & 5 deletions
```diff
@@ -68,18 +68,18 @@ fn configure_execution_providers(
             #[cfg(feature = "onnx-cuda")]
             {
                 // Use CUDA execution provider for GPU acceleration
-                tracing::debug!("Configuring ONNX Nvidia CUDA execution provider for GPU target");
+                tracing::debug!("Using ONNX runtime's Nvidia GPU CUDA execution provider");
                 Ok(vec![CUDAExecutionProvider::default().build()])
             }
             #[cfg(not(feature = "onnx-cuda"))]
             {
-                Err(BackendError::BackendAccess(wasmtime::format_err!(
-                    "GPU execution target is requested, but 'onnx-cuda' feature is not enabled"
-                )))
+                tracing::warn!("ONNX runtime GPU CUDA execution provider is not enabled, falling back to CPU");
+                Ok(vec![CPUExecutionProvider::default().build()])
             }
         }
         ExecutionTarget::Tpu => {
-            unimplemented!("TPU execution target is not supported for ONNX backend yet");
+            tracing::warn!("TPU execution target is not supported for ONNX backend yet, falling back to CPU");
+            Ok(vec![CPUExecutionProvider::default().build()])
        }
     }
 }
```
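The diff above replaces a hard error (when `gpu` is requested without the `onnx-cuda` feature) and an `unimplemented!` panic (for TPU) with a warning plus CPU fallback. A minimal, self-contained sketch of that selection pattern follows; the stub enums and the `CUDA_ENABLED` constant stand in for the real wasi-nn / `ort` types and the `onnx-cuda` cargo feature, so this is illustrative rather than the actual backend code:

```rust
// Simplified model of the execution-provider selection after this commit:
// every target resolves to *some* provider list; unsupported or
// unavailable accelerators degrade to CPU with a warning instead of
// returning an error or panicking.

#[derive(Debug, PartialEq)]
enum ExecutionTarget {
    Cpu,
    Gpu,
    Tpu,
}

#[derive(Debug, PartialEq)]
enum Provider {
    Cpu,
    Cuda,
}

// Stand-in for `cfg(feature = "onnx-cuda")`; flip to `true` to model a
// build with the CUDA execution provider compiled in.
const CUDA_ENABLED: bool = false;

fn configure_execution_providers(target: &ExecutionTarget) -> Vec<Provider> {
    match target {
        ExecutionTarget::Cpu => vec![Provider::Cpu],
        ExecutionTarget::Gpu => {
            if CUDA_ENABLED {
                vec![Provider::Cuda]
            } else {
                // Previously this path returned a BackendError; now it
                // warns and falls back to the CPU provider.
                eprintln!("warn: CUDA execution provider not enabled, falling back to CPU");
                vec![Provider::Cpu]
            }
        }
        ExecutionTarget::Tpu => {
            // Previously unimplemented!(); now a warn-and-fallback.
            eprintln!("warn: TPU not supported for ONNX backend, falling back to CPU");
            vec![Provider::Cpu]
        }
    }
}

fn main() {
    // Every target yields a usable provider list; nothing errors out.
    assert_eq!(configure_execution_providers(&ExecutionTarget::Cpu), vec![Provider::Cpu]);
    assert_eq!(configure_execution_providers(&ExecutionTarget::Gpu), vec![Provider::Cpu]);
    assert_eq!(configure_execution_providers(&ExecutionTarget::Tpu), vec![Provider::Cpu]);
    println!("all targets resolve to a provider");
}
```

Note the trade-off this models: requesting `gpu` on a CPU-only build no longer fails fast, which is why the README section above stresses enabling `ort` logging to detect silent fallback.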
