nvidia-riva
diff --git a/‎.gitignore
Lines changed: 19 additions & 0 deletions b/‎.gitignore
Lines changed: 19 additions & 0 deletions
diff --git a/‎app-backend/README.md
Lines changed: 243 additions & 0 deletions b/‎app-backend/README.md
Lines changed: 243 additions & 0 deletions
diff --git a/‎app-backend/download-protos.js
Lines changed: 98 additions & 0 deletions b/‎app-backend/download-protos.js
Lines changed: 98 additions & 0 deletions
@@ -186,3 +186,22 @@ tests/integration/tts/outputs
 riva/client/proto/*_pb2.py
 riva/client/proto/*_pb2_grpc.py
 
+
+# Downloaded/generated proto files and repositories
+app-backend/common/
+app-backend/riva/proto/
+
+# Node.js specific ignores for app-backend
+app-backend/node_modules/
+app-backend/coverage/
+app-backend/.nyc_output/
+app-backend/logs/
+app-backend/*.log
+app-backend/.env
+app-backend/.env.local
+app-backend/.env.development.local
+app-backend/.env.test.local
+app-backend/.env.production.local
+app-backend/npm-debug.log*
+app-backend/yarn-debug.log*
+app-backend/yarn-error.log*
@@ -0,0 +1,243 @@
+# Riva App Backend
+
+This is a Node.js proxy server that connects to the Riva API server. It provides API endpoints for automatic speech recognition (ASR) and text-to-speech (TTS) services.
+
+## Features
+
+- Direct connection to Riva server using official proto files
+- ASR (Automatic Speech Recognition) endpoint
+- TTS (Text-to-Speech) endpoint
+- WAV file support with header analysis and proper processing
+- Configurable via environment variables
+- WebSocket support for real-time streaming recognition
+
+## Setup
+
+1. Ensure you have Node.js installed (v14 or higher recommended)
+
+2. Install dependencies:
+   ```
+   npm install
+   ```
+
+3. Download the proto files:
+   ```
+   npm run download-protos
+   ```
+   This script will clone the nvidia-riva/common repository and copy the necessary proto files to the `riva/proto` directory.
+
+## Configuration
+
+Create a `.env` file in the `app-backend` directory with the following variables:
+
+```
+PORT=3002
+RIVA_API_URL=localhost:50051
+```
+
+- `PORT`: The port on which the proxy server will run
+- `RIVA_API_URL`: The address of the Riva API server, in `host:port` form as in the example above
+
+## Running the Server
+
+Start the server:
+
+```
+npm start
+```
+
+This will automatically run the `download-protos` script before starting the server if the proto files are not already present.
+
+## Testing the Application
+
+### Prerequisites
+
+Before testing:
+1. Ensure the Riva API server is running at the configured URL
+2. Verify that the proto files have been downloaded successfully
+3. Make sure the Node.js server is running (check for "Server listening on port 3002" message)
+4. Have sample audio files available for testing
+
+### Testing the API Endpoints Directly
+
+#### Testing the Health Endpoint
+
+```bash
+curl http://localhost:3002/health
+```
+
+Expected response:
+```json
+{
+  "status": "ok",
+  "services": {
+    "asr": {
+      "available": true
+    },
+    "tts": {
+      "available": true
+    }
+  }
+}
+```
+
+#### Testing ASR with a WAV File
+
+You can use the included test script:
+
+```bash
+# If you have a sample WAV file
+node test-asr.js /path/to/your/audio.wav
+```
+
+Or test manually with curl:
+
+```bash
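+# Convert WAV to base64 first (-w 0 disables line wrapping; this is the GNU coreutils flag)
+# On macOS use instead: base64 -i /path/to/your/audio.wav > audio.b64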
+base64 -w 0 /path/to/your/audio.wav > audio.b64
+
+# Send the request
+curl -X POST http://localhost:3002/api/recognize \
+  -H "Content-Type: application/json" \
+  -d @- << EOF
+{
+  "audio": "$(cat audio.b64)",
+  "config": {
+    "encoding": "LINEAR_PCM",
+    "sampleRateHertz": 16000,
+    "languageCode": "en-US",
+    "enableAutomaticPunctuation": true
+  }
+}
+EOF
+```
+
+### Testing with the Frontend
+
+The best way to test the complete functionality is using the provided frontend application:
+
+1. Start this backend server
+2. Start the Riva frontend application
+3. Use the frontend to upload audio files or test streaming recognition
+
+### Debugging and Log Information
+
+The server provides detailed logging for audio processing. When processing WAV files, it will:
+
+1. Log detection of WAV headers
+2. Display information about:
+   - Sample rate
+   - Number of channels
+   - Bits per sample
+   - Audio format
+
+When issues occur, check the console output for detailed error messages.
+
+## Troubleshooting Proto Files Download
+
+If you encounter issues downloading proto files:
+
+1. Check your internet connection
+2. Verify that git is installed and accessible
+3. Look for specific errors in the console output
+4. Confirm that `riva_common.proto` was copied into `riva/proto` together with the ASR, TTS, and audio proto files (the download script's filter includes it)
+5. Try running the download script manually:
+   ```
+   node download-protos.js
+   ```
+6. If problems persist, you can manually clone the repository and copy the proto files:
+   ```
+   git clone https://github.com/nvidia-riva/common.git
+   mkdir -p riva/proto
+   cp common/riva/proto/*.proto riva/proto/
+   ```
+
+## API Endpoints
+
+### Status
+
+- **GET** `/health`
+  - Returns the status of the ASR and TTS services
+
+### Speech Recognition (ASR)
+
+- **POST** `/api/recognize`
+  - Request body:
+    ```json
+    {
+      "audio": "<base64-encoded audio data>",
+      "config": {
+        "encoding": "LINEAR_PCM",
+        "sampleRateHertz": 16000,
+        "languageCode": "en-US",
+        "maxAlternatives": 1,
+        "enableAutomaticPunctuation": true,
+        "audioChannelCount": 1
+      }
+    }
+    ```
+  - Response:
+    ```json
+    {
+      "results": [
+        {
+          "alternatives": [
+            {
+              "transcript": "recognized text",
+              "confidence": 0.98
+            }
+          ]
+        }
+      ],
+      "text": "recognized text",
+      "confidence": 0.98
+    }
+    ```
+
+### WebSocket Streaming (ASR)
+
+- **WebSocket** `/streaming/asr`
+  - First message (config):
+    ```json
+    {
+      "sampleRate": 16000,
+      "encoding": "LINEAR_PCM",
+      "languageCode": "en-US",
+      "maxAlternatives": 1,
+      "enableAutomaticPunctuation": true
+    }
+    ```
+  - Subsequent messages: Binary audio data (16-bit PCM)
+  - Server responses (`isPartial` is either `true` or `false`):
+    ```json
+    {
+      "results": [
+        {
+          "alternatives": [
+            {
+              "transcript": "recognized text"
+            }
+          ]
+        }
+      ],
+      "isPartial": true
+    }
+    ```
+
+### Text to Speech (TTS)
+
+- **POST** `/api/synthesize`
+  - Request body:
+    ```json
+    {
+      "text": "Text to be synthesized",
+      "voice": "en-US-Scarlett",
+      "language": "en-US"
+    }
+    ```
+  - Response:
+    ```json
+    {
+      "audio": "<base64-encoded audio data>"
+    }
+    ```
@@ -0,0 +1,98 @@
+#!/usr/bin/env node
+
+const fs = require('fs');
+const path = require('path');
+const { execFileSync, execSync } = require('child_process');
+
+// Paths for proto files and repositories
+const SCRIPT_DIR = __dirname;
+const COMMON_DIR = path.join(SCRIPT_DIR, 'common');
+const PROTO_DIR = path.join(SCRIPT_DIR, 'riva/proto');
+
+console.log('Proto file downloader script');
+console.log(`Script directory: ${SCRIPT_DIR}`);
+console.log(`Common repository target: ${COMMON_DIR}`);
+console.log(`Proto files target: ${PROTO_DIR}`);
+
+// Create directories if they don't exist
+[COMMON_DIR, PROTO_DIR].forEach(dir => {
+  if (!fs.existsSync(dir)) {
+    console.log(`Creating directory: ${dir}`);
+    fs.mkdirSync(dir, { recursive: true });
+  }
+});
+
+// Function to download proto files from nvidia-riva/common repository
+function downloadProtoFiles() {
+  try {
+    console.log('Checking for existing proto files...');
+    
+    // Check if proto directory already contains proto files
+    if (fs.existsSync(path.join(PROTO_DIR, 'riva_asr.proto')) && 
+        fs.existsSync(path.join(PROTO_DIR, 'riva_tts.proto'))) {
+      console.log('Proto files already exist in proto directory, skipping download');
+      return true;
+    }
+    
+    // Check if common repository is already cloned
+    const commonRepoExists = fs.existsSync(path.join(COMMON_DIR, '.git'));
+    
+    if (!commonRepoExists) {
+      console.log('Cloning nvidia-riva/common repository...');
+      execSync(`git clone https://github.com/nvidia-riva/common.git ${COMMON_DIR}`, {
+        stdio: 'inherit'
+      });
+    } else {
+      console.log('Common repository already exists, pulling latest changes...');
+      execSync(`cd ${COMMON_DIR} && git pull`, {
+        stdio: 'inherit'
+      });
+    }
+    
+    // Check if the riva/proto directory exists in the cloned repo
+    const rivaProtoPath = path.join(COMMON_DIR, 'riva', 'proto');
+    if (!fs.existsSync(rivaProtoPath)) {
+      console.error(`Error: Expected directory not found: ${rivaProtoPath}`);
+      return false;
+    }
+    
+    // Copy proto files to our proto directory
+    console.log('Copying proto files to proto directory...');
+    const protoFiles = fs.readdirSync(rivaProtoPath);
+    
+    // Filter for relevant proto files (ASR and TTS)
+    const relevantProtos = protoFiles.filter(file => 
+      file.includes('riva_asr') || file.includes('riva_tts') || file.includes('riva_audio') || file.includes('riva_common')
+    );
+    
+    if (relevantProtos.length === 0) {
+      console.error('No relevant proto files found in the repository');
+      return false;
+    }
+    
+    // Copy each proto file
+    relevantProtos.forEach(file => {
+      const sourcePath = path.join(rivaProtoPath, file);
+      const targetPath = path.join(PROTO_DIR, file);
+      fs.copyFileSync(sourcePath, targetPath);
+      console.log(`Copied: ${file}`);
+    });
+    
+    console.log('Successfully downloaded and copied proto files');
+    console.log('Available proto files:');
+    fs.readdirSync(PROTO_DIR).forEach(file => {
+      console.log(`- ${file}`);
+    });
+    
+    return true;
+  } catch (error) {
+    console.error('Failed to download proto files:', error);
+    return false;
+  }
+}
+
+// Execute the download function
+const success = downloadProtoFiles();
+
+// Exit with appropriate code
+process.exit(success ? 0 : 1);