
Commit 6972f00

basic genai aidl
1 parent 0de2e66 commit 6972f00

14 files changed (+1208, -0 lines)
Lines changed: 157 additions & 0 deletions
@@ -0,0 +1,157 @@
package com.example.modeltest;

import java.io.File;
import java.util.Scanner;

import ai.onnxruntime.genai.GenAIException;
import ai.onnxruntime.genai.Generator;
import ai.onnxruntime.genai.GeneratorParams;
import ai.onnxruntime.genai.Model;
import ai.onnxruntime.genai.Sequences;
import ai.onnxruntime.genai.Tokenizer;
import ai.onnxruntime.genai.TokenizerStream;

/**
 * Standalone Java application to test the Phi-3 model locally.
 *
 * Usage:
 * 1. Make sure the model files are in the directory specified by MODEL_PATH
 * 2. Compile and run this application
 * 3. Enter prompts to test the model
 * 4. Type 'exit' to quit
 */
public class ModelTest {

    // Change this to the path where you have the model files locally
    private static final String MODEL_PATH = "C:\\Users\\shekadam\\.aitk\\models\\Microsoft\\Phi-3.5-mini-instruct-generic-cpu\\cpu-int4-rtn-block-32-acc-level-4";

    public static void main(String[] args) {
        System.out.println("Phi-3 Model Test Application");
        System.out.println("============================");

        // Check that the model directory exists
        File modelDir = new File(MODEL_PATH);
        if (!modelDir.exists() || !modelDir.isDirectory()) {
            System.err.println("Model directory not found at: " + MODEL_PATH);
            System.err.println("Please update the MODEL_PATH in the source code.");
            return;
        }

        // Check for model files
        File[] onnxFiles = modelDir.listFiles((dir, name) -> name.endsWith(".onnx"));
        if (onnxFiles == null || onnxFiles.length == 0) {
            System.err.println("No ONNX files found in directory: " + MODEL_PATH);
            return;
        }

        System.out.println("Found " + onnxFiles.length + " ONNX files in model directory");
        System.out.println("Initializing model, please wait...");

        Model model = null;
        Tokenizer tokenizer = null;

        try {
            // Initialize model and tokenizer
            long startTime = System.currentTimeMillis();
            model = new Model(MODEL_PATH);
            tokenizer = model.createTokenizer();
            long initTime = System.currentTimeMillis() - startTime;

            System.out.println("Model initialized successfully in " + initTime + "ms");
            System.out.println("Enter your prompts, or type 'exit' to quit:");

            // Process user prompts
            Scanner scanner = new Scanner(System.in);
            while (true) {
                System.out.print("\nPrompt> ");
                String input = scanner.nextLine().trim();

                if (input.equalsIgnoreCase("exit")) {
                    break;
                }

                if (input.isEmpty()) {
                    continue;
                }

                generateResponse(model, tokenizer, input);
            }

            scanner.close();

        } catch (GenAIException e) {
            System.err.println("Error initializing model: " + e.getMessage());
            e.printStackTrace();
        } finally {
            // Clean up native resources
            if (tokenizer != null) tokenizer.close();
            if (model != null) model.close();
        }
    }

    private static void generateResponse(Model model, Tokenizer tokenizer, String prompt) {
        TokenizerStream stream = null;
        GeneratorParams generatorParams = null;
        Sequences encodedPrompt = null;
        Generator generator = null;

        try {
            long startTime = System.currentTimeMillis();

            // Format the prompt with the Phi-3 chat template
            String promptFormatted = "<|system|>\nYou are a helpful AI assistant. Answer in two paragraphs or less.<|end|>\n<|user|>\n" +
                    prompt + "<|end|>\n<|assistant|>\n";

            // Create a tokenizer stream for incremental, token-by-token decoding
            stream = tokenizer.createStream();

            // Create generator parameters
            generatorParams = model.createGeneratorParams();
            generatorParams.setSearchOption("max_length", 100);
            generatorParams.setSearchOption("temperature", 0.7);
            generatorParams.setSearchOption("top_p", 0.9);

            // Encode the prompt
            encodedPrompt = tokenizer.encode(promptFormatted);
            generatorParams.setInput(encodedPrompt);

            // Create the generator
            generator = new Generator(model, generatorParams);

            StringBuilder result = new StringBuilder();
            System.out.print("\nGenerating: ");

            // Generate tokens until done
            int tokenCount = 0;
            while (!generator.isDone()) {
                generator.computeLogits();
                generator.generateNextToken();

                int token = generator.getLastTokenInSequence(0);
                String decodedToken = stream.decode(token);
                result.append(decodedToken);

                // Print progress as tokens arrive
                System.out.print(decodedToken);
                tokenCount++;
            }

            long totalTime = System.currentTimeMillis() - startTime;
            double tokensPerSecond = tokenCount * 1000.0 / totalTime;

            System.out.println("\n\nGeneration complete!");
            System.out.println("Time: " + totalTime + "ms for " + tokenCount + " tokens (" +
                    String.format("%.2f", tokensPerSecond) + " tokens/sec)");

        } catch (Exception e) {
            System.err.println("\nError generating response: " + e.getMessage());
            e.printStackTrace();
        } finally {
            // Clean up native resources in reverse order of creation
            if (generator != null) generator.close();
            if (encodedPrompt != null) encodedPrompt.close();
            if (stream != null) stream.close();
            if (generatorParams != null) generatorParams.close();
        }
    }
}
Lines changed: 159 additions & 0 deletions
@@ -0,0 +1,159 @@
# Android Dual App Project

This project demonstrates a dual-app architecture for on-device AI inference using ONNX Runtime on Android.

## Overview

The project consists of two separate Android applications:

1. **UI App**: Provides the user interface for input collection and result display.
2. **AI App**: Handles AI model loading and inference using ONNX Runtime and ONNX Runtime GenAI.

## Architecture

The apps communicate using Android's Inter-Process Communication (IPC) mechanism via AIDL (Android Interface Definition Language).

```
+-------------+           +-------------+
|             |           |             |
|   UI App    |<--------->|   AI App    |
| (User Input)|   AIDL    | (Inference) |
|             |           |             |
+-------------+           +-------------+
                                 |
                                 v
                            +----------+
                            |   ONNX   |
                            |  Model   |
                            +----------+
```

### Why Two Separate Apps?

This dual-app architecture provides several benefits:

1. **Memory Isolation**: The AI inference process runs in a separate memory space from the UI, preventing the UI from becoming unresponsive during inference.

2. **Process Separation**: If model inference crashes or uses excessive memory, it won't take down the UI app.

3. **Resource Management**: The AI app can be configured to run at a different priority level than the UI app.

4. **Update Flexibility**: The AI model implementation can be updated independently of the UI application.

5. **Security**: Sensitive model operations are isolated from the user-facing app.

### Communication Flow

1. The UI App binds to the AI App's `InferenceService` using AIDL (see the binding sketch after this list).
2. The user enters a prompt in the UI App.
3. The prompt is sent via AIDL to the AI App.
4. The AI App loads the model (if not already loaded) and performs inference.
5. The AI App returns the generated response to the UI App.
6. The UI App displays the response to the user.
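
To make step 1 concrete, here is a minimal sketch of how the UI App might bind to the service and call across the process boundary. The action string, package name, and `generateResponse` method are assumptions for illustration; the actual contract lives in `IInferenceService.aidl`.

```java
import android.content.ComponentName;
import android.content.Context;
import android.content.Intent;
import android.content.ServiceConnection;
import android.os.IBinder;
import android.os.RemoteException;

public class InferenceClient {

    private volatile IInferenceService service;

    private final ServiceConnection connection = new ServiceConnection() {
        @Override
        public void onServiceConnected(ComponentName name, IBinder binder) {
            // Convert the raw binder into the typed proxy generated from IInferenceService.aidl.
            service = IInferenceService.Stub.asInterface(binder);
        }

        @Override
        public void onServiceDisconnected(ComponentName name) {
            service = null; // the AI App's process died; rebind before the next call
        }
    };

    public void bind(Context context) {
        Intent intent = new Intent("com.example.aiapp.BIND_INFERENCE"); // hypothetical action
        intent.setPackage("com.example.aiapp");                         // hypothetical package name
        context.bindService(intent, connection, Context.BIND_AUTO_CREATE);
    }

    public String ask(String prompt) throws RemoteException {
        // AIDL calls are synchronous, so invoke this off the main thread for long inference.
        return service.generateResponse(prompt); // assumed method name
    }
}
```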

## Key Components

### UI App

- `MainActivity`: Manages the user interface and communication with the AI App.
- `IInferenceService.aidl`: Interface definition for communicating with the AI App's service.

### AI App

- `InferenceService`: Android Service that hosts the AI model and processes inference requests.
- `ModelManager`: Handles ONNX Runtime model initialization and inference.
- `ModelDownloader`: Utility for downloading or extracting model files.
- `IInferenceService.aidl`: The same interface definition; the service implements its generated Stub.
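
For illustration, a matching sketch of the service side: the `Stub` generated from `IInferenceService.aidl` is implemented inside `InferenceService` and handed out from `onBind`. The `ModelManager.getInstance().generate(...)` call is an assumed entry point, not a signature taken from this commit.

```java
import android.app.Service;
import android.content.Intent;
import android.os.IBinder;

public class InferenceService extends Service {

    private final IInferenceService.Stub binder = new IInferenceService.Stub() {
        @Override
        public String generateResponse(String prompt) {
            // Binder calls arrive on a binder thread pool, not the main thread,
            // so blocking here does not freeze the AI App's own UI.
            return ModelManager.getInstance().generate(prompt); // assumed API
        }
    };

    @Override
    public IBinder onBind(Intent intent) {
        return binder;
    }
}
```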

## Dependencies

- ONNX Runtime for Android: `com.microsoft.onnxruntime:onnxruntime-android:1.16.1`
- ONNX Runtime GenAI: `onnxruntime-genai-android-0.4.0-dev.aar`

## Setup and Running

### Building the Apps

1. Open the project in Android Studio
2. Build both the AIApp and UIApp modules
3. Make sure you have the `onnxruntime-genai-android-0.4.0-dev.aar` file in the `AIApp/libs/` folder

### Setting up the Model Files

1. Download the Microsoft Phi-3.5-mini model files (ONNX format)
2. Use the provided PowerShell script to push the model to your device:

```powershell
.\push_model.ps1 -modelDir "path\to\model\directory"
```

Or manually push the files via ADB:

```powershell
adb shell mkdir -p /sdcard/phi-3-model
adb push path\to\model-file.onnx /sdcard/phi-3-model/
adb push path\to\tokenizer.json /sdcard/phi-3-model/
```

### Running the Apps

1. Install both apps on your Android device
2. Launch the AI App first to initialize the service
3. Grant the necessary storage permissions when prompted
4. Start the service using the button in the AI App
5. Launch the UI App, which automatically connects to the AI service
6. Enter prompts in the UI App and receive model responses

### Monitoring Performance

The apps provide detailed performance logs via Android logcat. Connect your device to a computer and run:

```powershell
adb logcat -s ModelManager:D MemoryMonitor:D InferenceService:D UIApp:D
```

## Permissions

The applications require the following permissions:

- `READ_EXTERNAL_STORAGE` / `WRITE_EXTERNAL_STORAGE` - For accessing model files in external storage
- `READ_MEDIA_*` (Android 13+) - For accessing model files on newer Android versions

For Android 10+ devices, the app uses `requestLegacyExternalStorage="true"` to ensure compatibility with older storage access methods.
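
As a sketch, a runtime check for the legacy storage permission might look like the following (assuming the pre-Android-13 storage model that matches the `requestLegacyExternalStorage` approach above; the class name and request code are hypothetical):

```java
import android.Manifest;
import android.app.Activity;
import android.content.pm.PackageManager;

import androidx.core.app.ActivityCompat;
import androidx.core.content.ContextCompat;

public final class StoragePermissionHelper {

    private static final int REQUEST_STORAGE = 1001; // arbitrary request code

    /** Requests the legacy read permission if it has not been granted yet. */
    public static void ensureStoragePermission(Activity activity) {
        if (ContextCompat.checkSelfPermission(activity,
                Manifest.permission.READ_EXTERNAL_STORAGE) != PackageManager.PERMISSION_GRANTED) {
            ActivityCompat.requestPermissions(activity,
                    new String[] { Manifest.permission.READ_EXTERNAL_STORAGE },
                    REQUEST_STORAGE);
        }
    }
}
```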

## Model Setup

### Pushing Model Files to the Device using ADB

The app is configured to load model files from the `/sdcard/phi-3-model/` directory on your Android device. Follow these steps to push the model files:

1. Download the Phi-3.5 model files (the ONNX format files) from Microsoft or Hugging Face
2. Connect your Android device to your computer
3. Enable USB debugging on your device
4. Open a terminal and use these ADB commands:

```bash
# Create directory on device
adb shell mkdir -p /sdcard/phi-3-model

# Push model files to device
adb push path/to/model-file.onnx /sdcard/phi-3-model/
adb push path/to/tokenizer.json /sdcard/phi-3-model/
# Push any other required model files
```

5. Verify the files were transferred correctly:

```bash
adb shell ls -la /sdcard/phi-3-model/
```

### Alternative Setup Methods

For a production app, you might want to:

1. Copy the model files to the app's assets folder
2. Extract them at runtime to the app's internal storage (see the sketch below)
3. Download them from a server at runtime
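
A minimal sketch of options 1 and 2, assuming a model file bundled under `assets/` (the class and file names here are hypothetical):

```java
import android.content.Context;

import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;

public final class AssetModelExtractor {

    /** Copies the named asset into the app's private files directory and returns it. */
    public static File extract(Context context, String assetName) throws IOException {
        File outFile = new File(context.getFilesDir(), assetName);
        if (outFile.exists()) {
            return outFile; // already extracted on a previous launch
        }
        try (InputStream in = context.getAssets().open(assetName);
             OutputStream out = new FileOutputStream(outFile)) {
            byte[] buffer = new byte[8192];
            int read;
            while ((read = in.read(buffer)) != -1) {
                out.write(buffer, 0, read);
            }
        }
        return outFile;
    }
}

// Usage (hypothetical file name):
// File model = AssetModelExtractor.extract(context, "phi-3-model.onnx");
```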

## License

[Your license information here]
Lines changed: 9 additions & 0 deletions
@@ -0,0 +1,9 @@
// Top-level build file where you can add configuration options common to all sub-projects/modules.
plugins {
    id("com.android.application") version "8.2.0" apply false
    id("org.jetbrains.kotlin.android") version "1.9.0" apply false
}

tasks.register("clean", Delete::class) {
    delete(rootProject.buildDir)
}
Lines changed: 50 additions & 0 deletions
@@ -0,0 +1,50 @@
# PowerShell script to handle stubborn file locks
Write-Host "Attempting to resolve file lock issues..."

$buildPath = "AIApp\build"
$problematicFile = "AIApp\build\intermediates\compile_and_runtime_not_namespaced_r_class_jar\debug\R.jar"

# Stop all Gradle daemons so they release their file handles
Write-Host "Stopping Gradle daemons..."
& .\gradlew --stop

# Wait for processes to settle
Start-Sleep -Seconds 3

# Try to remove the specific problematic file first
if (Test-Path $problematicFile) {
    Write-Host "Attempting to remove problematic R.jar file..."
    try {
        Remove-Item -Path $problematicFile -Force -ErrorAction Stop
        Write-Host "Successfully removed R.jar"
    } catch {
        Write-Host "R.jar still locked, attempting workaround..."

        # Try to move the file to a temp location instead
        $tempFile = "$env:TEMP\R_$(Get-Date -Format 'yyyyMMdd_HHmmss').jar"
        try {
            Move-Item -Path $problematicFile -Destination $tempFile -Force
            Write-Host "Moved locked file to temp location: $tempFile"
        } catch {
            Write-Host "Could not move file, it's still locked by a process"
        }
    }
}

# Now try to remove the entire build directory
if (Test-Path $buildPath) {
    Write-Host "Removing build directory..."
    try {
        Remove-Item -Path $buildPath -Recurse -Force -ErrorAction Stop
        Write-Host "Successfully removed build directory"
    } catch {
        Write-Host "Some files in build directory are still locked"
    }
}

# Wait, then try a Gradle clean
Start-Sleep -Seconds 2
Write-Host "Attempting Gradle clean..."
& .\gradlew clean --no-daemon --no-build-cache

Write-Host "Script completed."
