
Commit ff72498

deploy: d95709e
1 parent 8e13814

File tree

11 files changed: +105 −97 lines


.well-known/agent-card.json

Lines changed: 1 addition & 1 deletion

@@ -3,7 +3,7 @@
   "name": "AnimaSync",
   "description": "Voice-driven 3D avatar animation engine for the browser. Extracts emotion from speech and generates lip sync, facial expressions, and body motion in real time — entirely client-side via Rust/WASM and ONNX inference.",
   "url": "https://animasync.quasar.ggls.dev/",
-  "version": "0.4.3",
+  "version": "0.4.4",
   "provider": {
     "organization": "GoodGang Labs",
     "url": "https://goodganglabs.com"

.well-known/ai-catalog.json

Lines changed: 6 additions & 6 deletions

@@ -46,15 +46,15 @@
   ],
   "packages": {
     "npm": [
-      {
-        "name": "@goodganglabs/lipsync-wasm-v2",
-        "description": "V2 engine — 52-dim ARKit blendshapes via student distillation. Recommended for most projects.",
-        "url": "https://www.npmjs.com/package/@goodganglabs/lipsync-wasm-v2"
-      },
       {
         "name": "@goodganglabs/lipsync-wasm-v1",
-        "description": "V1 engine — 111-dim ARKit blendshapes via phoneme classification. Full expression control.",
+        "description": "V1 engine — 111-dim ARKit blendshapes via phoneme classification. Recommended for most projects.",
         "url": "https://www.npmjs.com/package/@goodganglabs/lipsync-wasm-v1"
+      },
+      {
+        "name": "@goodganglabs/lipsync-wasm-v2",
+        "description": "V2 engine — 52-dim ARKit blendshapes via student distillation. Lightweight alternative.",
+        "url": "https://www.npmjs.com/package/@goodganglabs/lipsync-wasm-v2"
       }
     ]
   },

README.md

Lines changed: 15 additions & 15 deletions

@@ -80,7 +80,7 @@ Most lip sync engines stop at mouth shapes. AnimaSync goes further — it treats
 | **Lip Sync** | Mouth shapes matching phonemes | ONNX inference → ARKit blendshapes (jaw, mouth, tongue) |
 | **Facial Expression** | Emotion-driven brows, cheeks, eyes | Voice energy & pitch → expression mapping + anatomical constraints |
 | **Eye Animation** | Natural blinks, micro-movements | Stochastic blink injection (2.5–4.5s intervals, 15% double-blink) |
-| **Body Motion** | Idle breathing, speaking gestures | Embedded VRMA bone clips with automatic idle ↔ speaking crossfade |
+| **Body Motion** | Idle breathing, speaking gestures | Embedded VRMA bone clips with LoopPingPong idle + asymmetric crossfade (0.8s in, 1.0s out) |
 
 One audio stream in → a fully animated 3D avatar out.
 
@@ -91,11 +91,11 @@ One audio stream in → a fully animated 3D avatar out.
 ### Install
 
 ```bash
-# V2 recommended for most use cases
-npm install @goodganglabs/lipsync-wasm-v2
-
-# V1 for full 111-dim expression control
+# V1 recommended for most use cases
 npm install @goodganglabs/lipsync-wasm-v1
+
+# V2 lightweight alternative
+npm install @goodganglabs/lipsync-wasm-v2
 ```
 
 > Peer dependency: [`onnxruntime-web`](https://www.npmjs.com/package/onnxruntime-web) >= 1.17.0
@@ -163,17 +163,17 @@ The production site is available at **[animasync.quasar.ggls.dev](https://animas
 
 ## V1 vs V2
 
-| | V2 (Recommended) | V1 (Full Control) |
+| | V1 (Recommended) | V2 (Lightweight) |
 |---|---|---|
-| **npm** | `@goodganglabs/lipsync-wasm-v2` | `@goodganglabs/lipsync-wasm-v1` |
-| **Output** | 52-dim ARKit blendshapes | 111-dim ARKit blendshapes |
-| **Model** | Student distillation (direct prediction) | Phoneme classification → viseme mapping |
-| **Post-processing** | crisp_mouth + fade + auto-blink | OneEuroFilter + anatomical constraints |
-| **Expression generation** | Blink injection in post-process | Built-in `IdleExpressionGenerator` (blinks + micro-expressions) |
-| **Voice activity** | Not included | Built-in `VoiceActivityDetector` (body pose switching) |
-| **ONNX fallback** | None (ONNX required) | Heuristic mode (energy-based) |
-| **Body motion** | VRMA idle/speaking (both versions) | VRMA idle/speaking + VAD auto-switch |
-| **Best for** | Most projects, quick integration | Full expression control, custom avatars |
+| **npm** | `@goodganglabs/lipsync-wasm-v1` | `@goodganglabs/lipsync-wasm-v2` |
+| **Output** | 111-dim ARKit blendshapes | 52-dim ARKit blendshapes |
+| **Model** | Phoneme classification → viseme mapping | Student distillation (direct prediction) |
+| **Post-processing** | OneEuroFilter + anatomical constraints | crisp_mouth + fade + auto-blink |
+| **Expression generation** | Built-in `IdleExpressionGenerator` (blinks + micro-expressions) | Blink injection in post-process |
+| **Voice activity** | Built-in `VoiceActivityDetector` (body pose switching) | Not included |
+| **ONNX fallback** | Heuristic mode (energy-based) | None (ONNX required) |
+| **Body motion** | VRMA idle/speaking + VAD auto-switch (LoopPingPong, asymmetric crossfade) | VRMA idle/speaking (LoopPingPong, asymmetric crossfade) |
+| **Best for** | Full expression control, custom avatars | Quick integration, lightweight |
 
 ---
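The "asymmetric crossfade (0.8s in, 1.0s out)" the README now advertises can be sketched in isolation: the speaking weight ramps up over 0.8 s, ramps down over 1.0 s, and is eased with a smoothstep curve so the blend has zero slope at both ends. This is an illustrative standalone sketch with hypothetical names, not the package's internal API:

```javascript
// Raw crossfade progress in [0, 1]; 1 = fully "speaking".
let crossFadeProgress = 0;

// Advance the crossfade by dt seconds and return the eased speaking weight.
// Asymmetric durations (assumed from the README): 0.8 s fade-in, 1.0 s fade-out.
function updateCrossfade(dt, isSpeaking) {
  const duration = isSpeaking ? 0.8 : 1.0;   // faster into speaking, slower back to idle
  const step = dt / duration;                // linear progress contributed this frame
  crossFadeProgress = isSpeaking
    ? Math.min(crossFadeProgress + step, 1)
    : Math.max(crossFadeProgress - step, 0);
  // Smoothstep easing: w = t^2 (3 - 2t); the idle weight would be 1 - w.
  const t = crossFadeProgress;
  return t * t * (3 - 2 * t);
}
```

Because the linear progress is eased only at read time, switching direction mid-fade stays continuous: the progress variable simply reverses from wherever it is.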

agents.json

Lines changed: 2 additions & 2 deletions

@@ -29,7 +29,7 @@
       "id": "quick-start-v2",
       "name": "Quick Start with V2 Engine",
       "description": "Install AnimaSync V2, initialize the engine, and process an audio file to get 52 ARKit blendshape animation frames at 30fps.",
-      "agent_instructions": "Use this flow when a developer wants to add lip sync animation to a web app. V2 is recommended for most use cases — simpler integration, direct 52-dim prediction.",
+      "agent_instructions": "Use this flow when a developer wants to add lip sync animation to a web app. V1 is recommended for most use cases — full expression control with built-in VAD and idle expressions.",
       "steps": [
         {
           "action": "install",
@@ -150,7 +150,7 @@
         },
         {
           "action": "init-animasync",
-          "code": "<script type=\"module\">\nconst CDN = 'https://cdn.jsdelivr.net/npm/@goodganglabs/lipsync-wasm-v2@0.4.3';\nconst { LipSyncWasmWrapper } = await import(`${CDN}/lipsync-wasm-wrapper.js`);\nconst lipsync = new LipSyncWasmWrapper({ wasmPath: `${CDN}/lipsync_wasm_v2.js` });\nawait lipsync.init();\n</script>",
+          "code": "<script type=\"module\">\nconst CDN = 'https://cdn.jsdelivr.net/npm/@goodganglabs/lipsync-wasm-v2@0.4.4';\nconst { LipSyncWasmWrapper } = await import(`${CDN}/lipsync-wasm-wrapper.js`);\nconst lipsync = new LipSyncWasmWrapper({ wasmPath: `${CDN}/lipsync_wasm_v2.js` });\nawait lipsync.init();\n</script>",
           "description": "Import and initialize AnimaSync V2 from CDN"
         }
       ]

examples/guide/index.html

Lines changed: 20 additions & 14 deletions

@@ -603,7 +603,7 @@ <h2 class="step-title">Initialize AnimaSync</h2>
           <button data-action="fold">Fold</button>
         </div>
       </div>
-      <div class="code-block"><span class="kw">const</span> CDN = <span class="str">'https://cdn.jsdelivr.net/npm/&#64;goodganglabs/lipsync-wasm-v1&#64;0.4.3'</span>;
+      <div class="code-block"><span class="kw">const</span> CDN = <span class="str">'https://cdn.jsdelivr.net/npm/&#64;goodganglabs/lipsync-wasm-v1&#64;0.4.4'</span>;
 
 <span class="kw">const</span> { <span class="fn">LipSyncWasmWrapper</span> } = <span class="kw">await</span> <span class="fn">import</span>(<span class="str">`${CDN}/lipsync-wasm-wrapper.js`</span>);
 <span class="kw">const</span> lipsync = <span class="kw">new</span> <span class="fn">LipSyncWasmWrapper</span>({ <span class="attr">wasmPath</span>: <span class="str">`${CDN}/lipsync_wasm_v1.js`</span> });
@@ -895,7 +895,7 @@ <h2 class="step-title">Add Real-time Microphone</h2>
 // ════════════════════════════════════════
 // Config
 // ════════════════════════════════════════
-const VERSION = '0.4.3';
+const VERSION = '0.4.4';
 const CDN = `https://cdn.jsdelivr.net/npm/@goodganglabs/lipsync-wasm-v1@${VERSION}`;
 const ARKIT_52 = [
   'browDownLeft','browDownRight','browInnerUp','browOuterUpLeft','browOuterUpRight',
@@ -1012,11 +1012,11 @@ <h2 class="step-title">Add Real-time Microphone</h2>
   const vrmaBytes = lipsync.getVrmaBytes();
   if (vrmaBytes?.idle?.length) {
     const a = await loadVRMAFromBytes(vrmaBytes.idle);
-    if (a) { idleAction = mixer.clipAction(createVRMAnimationClip(a, vrm)); idleAction.play(); }
+    if (a) { idleAction = mixer.clipAction(createVRMAnimationClip(a, vrm)); idleAction.setLoop(THREE.LoopPingPong); idleAction.play(); }
   }
   if (vrmaBytes?.speaking?.length) {
     const a = await loadVRMAFromBytes(vrmaBytes.speaking);
-    if (a) { speakingAction = mixer.clipAction(createVRMAnimationClip(a, vrm)); speakingAction.play(); speakingAction.setEffectiveWeight(0); }
+    if (a) { speakingAction = mixer.clipAction(createVRMAnimationClip(a, vrm)); speakingAction.setLoop(THREE.LoopPingPong); speakingAction.play(); speakingAction.setEffectiveWeight(0); }
   }
 } catch (e) { console.warn('VRMA skip:', e.message); }
@@ -1251,12 +1251,15 @@ <h2 class="step-title">Add Real-time Microphone</h2>
   for (const n of names) vrm.expressionManager.setValue(n, 0);
   prevFrame = null;
 }
-function transitionToSpeaking() { isSpeaking = true; crossFadeProgress = 1; }
+function transitionToSpeaking() { isSpeaking = true; }
 function transitionToIdle() { isSpeaking = false; }
 function updateBoneWeights(dt) {
-  const speed = 3.0;
-  if (isSpeaking && crossFadeProgress < 1) crossFadeProgress = Math.min(1, crossFadeProgress + dt * speed);
-  else if (!isSpeaking && crossFadeProgress > 0) crossFadeProgress = Math.max(0, crossFadeProgress - dt * speed);
+  const target = isSpeaking ? 1 : 0;
+  const duration = isSpeaking ? 0.8 : 1.0;
+  const step = dt / duration;
+  crossFadeProgress = target > crossFadeProgress
+    ? Math.min(crossFadeProgress + step, 1)
+    : Math.max(crossFadeProgress - step, 0);
   const w = crossFadeProgress * crossFadeProgress * (3 - 2 * crossFadeProgress);
   if (idleAction) idleAction.setEffectiveWeight(1 - w);
   if (speakingAction) speakingAction.setEffectiveWeight(w);
@@ -1590,11 +1593,11 @@ <h2 class="step-title">Add Real-time Microphone</h2>
 '    const vrmaBytes = lipsync.getVrmaBytes();',
 '    if (vrmaBytes?.idle?.length) {',
 '      const a = await loadVRMAFromBytes(vrmaBytes.idle);',
-'      if (a) { idleAction = mixer.clipAction(createVRMAnimationClip(a, vrm)); idleAction.play(); }',
+'      if (a) { idleAction = mixer.clipAction(createVRMAnimationClip(a, vrm)); idleAction.setLoop(THREE.LoopPingPong); idleAction.play(); }',
 '    }',
 '    if (vrmaBytes?.speaking?.length) {',
 '      const a = await loadVRMAFromBytes(vrmaBytes.speaking);',
-'      if (a) { speakingAction = mixer.clipAction(createVRMAnimationClip(a, vrm)); speakingAction.play(); speakingAction.setEffectiveWeight(0); }',
+'      if (a) { speakingAction = mixer.clipAction(createVRMAnimationClip(a, vrm)); speakingAction.setLoop(THREE.LoopPingPong); speakingAction.play(); speakingAction.setEffectiveWeight(0); }',
 '    }',
 "  } catch (e) { console.warn('VRMA skip:', e.message); }",
 '}',
@@ -1776,12 +1779,15 @@ <h2 class="step-title">Add Real-time Microphone</h2>
 '  for (const n of names) vrm.expressionManager.setValue(n, 0);',
 '  prevFrame = null;',
 '}',
-'function transitionToSpeaking() { isSpeaking = true; crossFadeProgress = 1; }',
+'function transitionToSpeaking() { isSpeaking = true; }',
 'function transitionToIdle() { isSpeaking = false; }',
 'function updateBoneWeights(dt) {',
-'  const speed = 3.0;',
-'  if (isSpeaking && crossFadeProgress < 1) crossFadeProgress = Math.min(1, crossFadeProgress + dt * speed);',
-'  else if (!isSpeaking && crossFadeProgress > 0) crossFadeProgress = Math.max(0, crossFadeProgress - dt * speed);',
+'  const target = isSpeaking ? 1 : 0;',
+'  const duration = isSpeaking ? 0.8 : 1.0;',
+'  const step = dt / duration;',
+'  crossFadeProgress = target > crossFadeProgress',
+'    ? Math.min(crossFadeProgress + step, 1)',
+'    : Math.max(crossFadeProgress - step, 0);',
 '  const w = crossFadeProgress * crossFadeProgress * (3 - 2 * crossFadeProgress);',
 '  if (idleAction) idleAction.setEffectiveWeight(1 - w);',
 '  if (speakingAction) speakingAction.setEffectiveWeight(w);',

examples/vanilla-avatar/index.html

Lines changed: 1 addition & 1 deletion

@@ -199,7 +199,7 @@ <h2>52 ARKit Blendshapes — V2 Student</h2>
 // No 3D avatar, no Three.js. Pure audio → lip sync data (52-dim).
 // ================================================================
 
-const VERSION = '0.4.3';
+const VERSION = '0.4.4';
 const CDN = `https://cdn.jsdelivr.net/npm/@goodganglabs/lipsync-wasm-v2@${VERSION}`;
 
 // ── All 52 ARKit blendshape channels ──

examples/vanilla-basic/index.html

Lines changed: 1 addition & 1 deletion

@@ -199,7 +199,7 @@ <h2>52 ARKit Blendshapes — V1 Phoneme</h2>
 // No 3D avatar, no Three.js. Pure audio → lip sync + expression + blink data.
 // ================================================================
 
-const VERSION = '0.4.3';
+const VERSION = '0.4.4';
 const CDN = `https://cdn.jsdelivr.net/npm/@goodganglabs/lipsync-wasm-v1@${VERSION}`;
 
 // ── All 52 ARKit blendshape channels ──

examples/vanilla-comparison/index.html

Lines changed: 11 additions & 9 deletions

@@ -253,7 +253,7 @@ <h1>Anima<span>Sync</span></h1>
 // ================================================================
 // Config
 // ================================================================
-const VERSION = '0.4.3';
+const VERSION = '0.4.4';
 const CDN_V1 = `https://cdn.jsdelivr.net/npm/@goodganglabs/lipsync-wasm-v1@${VERSION}`;
 const CDN_V2 = `https://cdn.jsdelivr.net/npm/@goodganglabs/lipsync-wasm-v2@${VERSION}`;
 
@@ -372,26 +372,28 @@ <h1>Anima<span>Sync</span></h1>
     const vrmaBytes = lipsyncInstance.getVrmaBytes();
     if (vrmaBytes?.idle?.length) {
       const anim = await loadVRMAFromBytes(vrmaBytes.idle);
-      if (anim) { idleAct = mixer.clipAction(createVRMAnimationClip(anim, vrm)); idleAct.play(); }
+      if (anim) { idleAct = mixer.clipAction(createVRMAnimationClip(anim, vrm)); idleAct.setLoop(THREE.LoopPingPong); idleAct.play(); }
     }
     if (vrmaBytes?.speaking?.length) {
       const anim = await loadVRMAFromBytes(vrmaBytes.speaking);
-      if (anim) { speakAct = mixer.clipAction(createVRMAnimationClip(anim, vrm)); speakAct.play(); speakAct.setEffectiveWeight(0); }
+      if (anim) { speakAct = mixer.clipAction(createVRMAnimationClip(anim, vrm)); speakAct.setLoop(THREE.LoopPingPong); speakAct.play(); speakAct.setEffectiveWeight(0); }
     }
   } catch (e) { console.warn('VRMA skip:', e.message); }
 
   return { vrm, mixer, idleAction: idleAct, speakingAction: speakAct };
 }
 
-function transitionToSpeaking() { isSpeaking = true; crossFadeProgress = 1; }
+function transitionToSpeaking() { isSpeaking = true; }
 function transitionToIdle() { isSpeaking = false; }
 
 function updateBoneWeights(delta) {
-  const speed = 3.0;
-  if (isSpeaking && crossFadeProgress < 1) crossFadeProgress = Math.min(1, crossFadeProgress + delta * speed);
-  else if (!isSpeaking && crossFadeProgress > 0) crossFadeProgress = Math.max(0, crossFadeProgress - delta * speed);
-  const t = crossFadeProgress;
-  const w = t * t * (3 - 2 * t);
+  const target = isSpeaking ? 1 : 0;
+  const duration = isSpeaking ? 0.8 : 1.0;
+  const step = delta / duration;
+  crossFadeProgress = target > crossFadeProgress
+    ? Math.min(crossFadeProgress + step, 1)
+    : Math.max(crossFadeProgress - step, 0);
+  const w = crossFadeProgress * crossFadeProgress * (3 - 2 * crossFadeProgress);
   if (idleActionV1) idleActionV1.setEffectiveWeight(1 - w);
   if (speakingActionV1) speakingActionV1.setEffectiveWeight(w);
   if (idleActionV2) idleActionV2.setEffectiveWeight(1 - w);