
Commit 6918555

docs: Binary image segmentation example (#1795)
1 parent 6e8a4dc commit 6918555

14 files changed (+778 -169 lines)

apps/typegpu-docs/astro.config.mjs

Lines changed: 5 additions & 1 deletion

@@ -46,7 +46,10 @@ export default defineConfig({
       'process.env.NODE_DEBUG_NATIVE': '""',
     },
     optimizeDeps: {
-      exclude: ['@rolldown/browser'],
+      exclude: [
+        '@rolldown/browser',
+        'onnxruntime-web',
+      ],
     },
     // Allowing query params, for invalidation
     plugins: [
@@ -65,6 +68,7 @@ export default defineConfig({
       noExternal: [
         'wgsl-wasm-transpiler-bundler',
         '@rolldown/browser',
+        'onnxruntime-web',
       ],
     },
   },
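A note on this change: Vite's optimizeDeps.exclude keeps onnxruntime-web out of dependency pre-bundling, and listing it under ssr.noExternal makes Vite bundle it during SSR instead of importing it as an external module, mirroring how @rolldown/browser was already handled. This is presumably what lets the package's WASM assets resolve correctly in the docs site.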

apps/typegpu-docs/package.json

Lines changed: 3 additions & 1 deletion

@@ -38,11 +38,13 @@
     "fuse.js": "catalog:frontend",
     "jotai": "^2.15.0",
     "jotai-location": "^0.6.2",
+    "lodash": "^4.17.21",
     "lucide-react": "^0.536.0",
     "lz-string": "^1.5.0",
     "monaco-editor": "^0.53.0",
     "morphcharts": "^1.3.2",
     "motion": "^12.23.24",
+    "onnxruntime-web": "1.23.0-dev.20250917-21fbad8a65",
     "pathe": "^2.0.3",
     "react": "^19.1.0",
     "react-dom": "^19.1.0",
@@ -66,8 +68,8 @@
     "@types/babel__standalone": "^7.1.9",
     "@types/babel__template": "^7.4.4",
     "@types/babel__traverse": "^7.20.7",
-    "@types/node": "^24.7.0",
     "@types/dom-mediacapture-record": "^1.0.22",
+    "@types/node": "^24.7.0",
     "@vitejs/plugin-basic-ssl": "^2.1.0",
     "@webgpu/types": "catalog:types",
     "astro-vtbot": "^2.1.6",
Binary file not shown.
Lines changed: 7 additions & 0 deletions

@@ -0,0 +1,7 @@
+<canvas></canvas>
+<video
+  autoplay
+  playsinline
+  class="absolute top-0 left-0 w-px h-px opacity-0 pointer-events-none"
+>
+</video>
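The video element is kept technically rendered but imperceptible (1 px square, opacity 0) rather than display: none, presumably so the browser keeps decoding frames and the element remains a valid source for importExternalTexture and requestVideoFrameCallback while only the processed canvas is visible.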
Lines changed: 331 additions & 0 deletions

@@ -0,0 +1,331 @@
+import tgpu, {
+  type RenderFlag,
+  type SampledFlag,
+  type StorageFlag,
+  type TgpuBindGroup,
+  type TgpuTexture,
+} from 'typegpu';
+import { fullScreenTriangle } from 'typegpu/common';
+import * as d from 'typegpu/data';
+import { MODEL_HEIGHT, MODEL_WIDTH, prepareSession } from './model.ts';
+import {
+  blockDim,
+  blurLayout,
+  drawWithMaskLayout,
+  generateMaskLayout,
+  prepareModelInputLayout,
+  sampleBiasSlot,
+  useGaussianSlot,
+} from './schemas.ts';
+import {
+  computeFn,
+  drawWithMaskFragment,
+  generateMaskFromOutput,
+  prepareModelInput,
+} from './shaders.ts';
+
+// Background segmentation uses the u2netp model (https://github.com/xuebinqin/U-2-Net)
+// by Xuebin Qin et al., licensed under the Apache License 2.0 (https://www.apache.org/licenses/LICENSE-2.0)
+
+// We need to wait for this issue to be closed and a fix released: https://github.com/microsoft/onnxruntime/issues/26480
+if (/^((?!chrome|android).)*safari/i.test(navigator.userAgent)) {
+  throw new Error('Unfortunately, ONNX does not work on Safari or iOS yet.');
+}
+
+// setup
+
+const canvas = document.querySelector('canvas') as HTMLCanvasElement;
+const video = document.querySelector('video') as HTMLVideoElement;
+
+if (navigator.mediaDevices.getUserMedia) {
+  video.srcObject = await navigator.mediaDevices.getUserMedia({
+    video: {
+      facingMode: 'user',
+      width: { ideal: 1280 },
+      height: { ideal: 720 },
+      frameRate: { ideal: 60 },
+    },
+  });
+} else {
+  throw new Error('getUserMedia not supported');
+}
+
+const adapter = await navigator.gpu?.requestAdapter();
+const device = await adapter?.requestDevice() as GPUDevice;
+
+if (!device || !adapter) {
+  throw new Error('Failed to initialize device.');
+}
+
+// monkey patching ONNX: https://github.com/microsoft/onnxruntime/issues/26107
+const oldRequestAdapter = navigator.gpu.requestAdapter;
+const oldRequestDevice = adapter.requestDevice;
+navigator.gpu.requestAdapter = async () => adapter;
+adapter.requestDevice = async () => device;
+const root = await tgpu.initFromDevice({ device });
+const context = canvas.getContext('webgpu') as GPUCanvasContext;
+const presentationFormat = navigator.gpu.getPreferredCanvasFormat();
+
+context.configure({
+  device,
+  format: presentationFormat,
+  alphaMode: 'premultiplied',
+});
+
+// resources
+
+let blurStrength = 5;
+let useGaussianBlur = false;
+
+const zeroBuffer = root.createBuffer(d.u32, 0).$usage('uniform');
+const oneBuffer = root.createBuffer(d.u32, 1).$usage('uniform');
+const useGaussianUniform = root.createUniform(d.u32, 0);
+const sampleBiasUniform = root.createUniform(d.f32, 0);
+
+const sampler = root['~unstable'].createSampler({
+  magFilter: 'linear',
+  minFilter: 'linear',
+  mipmapFilter: 'linear',
+});
+
+const maskTexture = root['~unstable'].createTexture({
+  size: [MODEL_WIDTH, MODEL_HEIGHT],
+  format: 'rgba8unorm',
+  dimension: '2d',
+}).$usage('sampled', 'render', 'storage');
+
+const modelInputBuffer = root
+  .createBuffer(d.arrayOf(d.f32, 3 * MODEL_WIDTH * MODEL_HEIGHT))
+  .$usage('storage');
+
+const modelOutputBuffer = root
+  .createBuffer(d.arrayOf(d.f32, 1 * MODEL_WIDTH * MODEL_HEIGHT))
+  .$usage('storage');
+
+let blurredTextures: (
+  & TgpuTexture<{
+    size: [number, number];
+    format: 'rgba8unorm';
+    mipLevelCount: 10;
+  }>
+  & StorageFlag
+  & SampledFlag
+  & RenderFlag
+)[];
+
+const generateMaskBindGroup = root.createBindGroup(generateMaskLayout, {
+  maskTexture,
+  outputBuffer: modelOutputBuffer,
+});
+
+let blurBindGroups: TgpuBindGroup<typeof blurLayout.entries>[];
+
+// pipelines
+
+const prepareModelInputPipeline = root['~unstable']
+  .createGuardedComputePipeline(
+    prepareModelInput,
+  );
+
+const session = await prepareSession(
+  root.unwrap(modelInputBuffer),
+  root.unwrap(modelOutputBuffer),
+);
+
+const generateMaskFromOutputPipeline = root['~unstable']
+  .createGuardedComputePipeline(
+    generateMaskFromOutput,
+  );
+
+const blurPipeline = root['~unstable']
+  .withCompute(computeFn)
+  .createPipeline();
+
+const drawWithMaskPipeline = root['~unstable']
+  .with(useGaussianSlot, useGaussianUniform)
+  .with(sampleBiasSlot, sampleBiasUniform)
+  .withVertex(fullScreenTriangle, {})
+  .withFragment(drawWithMaskFragment, { format: presentationFormat })
+  .createPipeline();
+
+// recalculating mask
+
+let calculateMaskCallbackId: number | undefined;
+
+async function processCalculateMask() {
+  if (video.readyState < 2) {
+    calculateMaskCallbackId = video.requestVideoFrameCallback(
+      processCalculateMask,
+    );
+    return;
+  }
+
+  prepareModelInputPipeline
+    .with(root.createBindGroup(prepareModelInputLayout, {
+      inputTexture: device.importExternalTexture({ source: video }),
+      outputBuffer: modelInputBuffer,
+      sampler,
+    }))
+    .dispatchThreads(MODEL_WIDTH, MODEL_HEIGHT);
+
+  await session.run();
+
+  generateMaskFromOutputPipeline
+    .with(generateMaskBindGroup)
+    .dispatchThreads(MODEL_WIDTH, MODEL_HEIGHT);
+
+  calculateMaskCallbackId = video.requestVideoFrameCallback(
+    processCalculateMask,
+  );
+}
+calculateMaskCallbackId = video.requestVideoFrameCallback(processCalculateMask);
+
+// frame
+
+function onVideoChange(size: { width: number; height: number }) {
+  const aspectRatio = size.width / size.height;
+  video.style.height = `${video.clientWidth / aspectRatio}px`;
+  if (canvas.parentElement) {
+    canvas.parentElement.style.aspectRatio = `${aspectRatio}`;
+    canvas.parentElement.style.height =
+      `min(100cqh, calc(100cqw/(${aspectRatio})))`;
+  }
+  blurredTextures = [0, 1].map(() =>
+    root['~unstable'].createTexture({
+      size: [size.width, size.height],
+      format: 'rgba8unorm',
+      dimension: '2d',
+      mipLevelCount: 10,
+    }).$usage('sampled', 'render', 'storage')
+  );
+  blurBindGroups = [
+    root.createBindGroup(blurLayout, {
+      flip: zeroBuffer,
+      inTexture: blurredTextures[0],
+      outTexture: blurredTextures[1].createView(
+        d.textureStorage2d('rgba8unorm', 'read-only'),
+        { mipLevelCount: 1 },
+      ),
+      sampler,
+    }),
+    root.createBindGroup(blurLayout, {
+      flip: oneBuffer,
+      inTexture: blurredTextures[1],
+      outTexture: blurredTextures[0].createView(
+        d.textureStorage2d('rgba8unorm', 'read-only'),
+        { mipLevelCount: 1 },
+      ),
+      sampler,
+    }),
+  ];
+}
+
+let videoFrameCallbackId: number | undefined;
+let lastFrameSize: { width: number; height: number } | undefined;
+
+async function processVideoFrame(
+  _: number,
+  metadata: VideoFrameCallbackMetadata,
+) {
+  if (video.readyState < 2) {
+    videoFrameCallbackId = video.requestVideoFrameCallback(processVideoFrame);
+    return;
+  }
+
+  const frameWidth = metadata.width;
+  const frameHeight = metadata.height;
+
+  if (
+    !lastFrameSize ||
+    lastFrameSize.width !== frameWidth ||
+    lastFrameSize.height !== frameHeight
+  ) {
+    lastFrameSize = { width: frameWidth, height: frameHeight };
+    onVideoChange(lastFrameSize);
+  }
+
+  blurredTextures[0].write(video);
+
+  if (useGaussianBlur) {
+    for (const _ of Array(blurStrength * 2)) {
+      blurPipeline
+        .with(blurBindGroups[0])
+        .dispatchWorkgroups(
+          Math.ceil(frameWidth / blockDim),
+          Math.ceil(frameHeight / 4),
+        );
+      blurPipeline
+        .with(blurBindGroups[1])
+        .dispatchWorkgroups(
+          Math.ceil(frameHeight / blockDim),
+          Math.ceil(frameWidth / 4),
+        );
+    }
+  } else {
+    blurredTextures[0].generateMipmaps();
+  }
+
+  drawWithMaskPipeline
+    .withColorAttachment({
+      view: context.getCurrentTexture().createView(),
+      clearValue: [1, 1, 1, 1],
+      loadOp: 'clear',
+      storeOp: 'store',
+    })
+    .with(root.createBindGroup(drawWithMaskLayout, {
+      inputTexture: device.importExternalTexture({ source: video }),
+      inputBlurredTexture: blurredTextures[0],
+      maskTexture,
+      sampler,
+    }))
+    .draw(3);
+
+  videoFrameCallbackId = video.requestVideoFrameCallback(processVideoFrame);
+}
+videoFrameCallbackId = video.requestVideoFrameCallback(processVideoFrame);
+
+// #region Example controls & Cleanup
+
+export const controls = {
+  'blur type': {
+    initial: 'mipmaps',
+    options: ['mipmaps', 'gaussian'],
+    async onSelectChange(value: string) {
+      useGaussianBlur = value === 'gaussian';
+      useGaussianUniform.write(useGaussianBlur ? 1 : 0);
+    },
+  },
+  'blur strength': {
+    initial: blurStrength,
+    min: 0,
+    max: 10,
+    step: 1,
+    onSliderChange(newValue: number) {
+      blurStrength = newValue;
+      sampleBiasUniform.write(blurStrength);
+    },
+  },
+};
+
+export function onCleanup() {
+  if (videoFrameCallbackId !== undefined) {
+    video.cancelVideoFrameCallback(videoFrameCallbackId);
+  }
+  if (calculateMaskCallbackId !== undefined) {
+    video.cancelVideoFrameCallback(calculateMaskCallbackId);
+  }
+  session.release();
+  if (video.srcObject) {
+    for (const track of (video.srcObject as MediaStream).getTracks()) {
+      track.stop();
+    }
+  }
+  navigator.gpu.requestAdapter = oldRequestAdapter;
+  if (adapter) {
+    adapter.requestDevice = oldRequestDevice;
+  }
+
+  root.destroy();
+}
+
+// #endregion
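
Per frame, the example samples the camera into modelInputBuffer with a compute pass (prepareModelInput), runs the u2netp session on that buffer, expands the result into maskTexture (generateMaskFromOutput), and composites the sharp and blurred video through the mask in drawWithMask. The model.ts file is not part of this excerpt; below is a minimal sketch of what its prepareSession could look like, assuming onnxruntime-web's WebGPU execution provider with GPU-buffer IO binding. The model URL, the tensor names 'input' and 'output', and the 320x320 input size are assumptions for illustration, not the committed code.

// model.ts - hypothetical sketch, not the committed file
import * as ort from 'onnxruntime-web';

// u2netp is commonly run at 320x320 input (assumed here).
export const MODEL_WIDTH = 320;
export const MODEL_HEIGHT = 320;

export async function prepareSession(
  inputBuffer: GPUBuffer,
  outputBuffer: GPUBuffer,
) {
  const session = await ort.InferenceSession.create('/u2netp.onnx', {
    executionProviders: ['webgpu'],
  });

  // Bind the pre-allocated GPU buffers directly, so frames never
  // round-trip through the CPU between TypeGPU and ONNX Runtime.
  const feeds = {
    input: ort.Tensor.fromGpuBuffer(inputBuffer, {
      dataType: 'float32',
      dims: [1, 3, MODEL_HEIGHT, MODEL_WIDTH],
    }),
  };
  const fetches = {
    output: ort.Tensor.fromGpuBuffer(outputBuffer, {
      dataType: 'float32',
      dims: [1, 1, MODEL_HEIGHT, MODEL_WIDTH],
    }),
  };

  return {
    run: () => session.run(feeds, fetches),
    release: () => session.release(),
  };
}

GPU-buffer IO binding of this kind is also why the example monkey-patches requestAdapter and requestDevice: ONNX Runtime and TypeGPU must share a single GPUDevice for the same buffers to be valid in both.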
Lines changed: 5 additions & 0 deletions

@@ -0,0 +1,5 @@
+{
+  "title": "Background Segmentation",
+  "category": "image-processing",
+  "tags": ["experimental", "camera", "onnx"]
+}
