open-edge-platform
diff --git a/‎usecases/ai/edge-ai-demo-studio/workers/embedding/pyproject.toml‎
Lines changed: 1 addition & 1 deletion b/‎usecases/ai/edge-ai-demo-studio/workers/embedding/pyproject.toml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎usecases/ai/edge-ai-demo-studio/workers/embedding/utils/rag_engine.py‎
Lines changed: 2 additions & 2 deletions b/‎usecases/ai/edge-ai-demo-studio/workers/embedding/utils/rag_engine.py‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎usecases/ai/edge-ai-demo-studio/workers/embedding/utils/util.py‎
Lines changed: 1 addition & 0 deletions b/‎usecases/ai/edge-ai-demo-studio/workers/embedding/utils/util.py‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎usecases/ai/edge-ai-demo-studio/workers/embedding/uv.lock‎
Lines changed: 2 additions & 15 deletions b/‎usecases/ai/edge-ai-demo-studio/workers/embedding/uv.lock‎
Lines changed: 2 additions & 15 deletions
diff --git a/‎usecases/ai/edge-ai-demo-studio/workers/image-generation/utils/util.py‎
Lines changed: 1 addition & 0 deletions b/‎usecases/ai/edge-ai-demo-studio/workers/image-generation/utils/util.py‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎usecases/ai/edge-ai-demo-studio/workers/speech-to-text/utils.py‎
Lines changed: 1 addition & 0 deletions b/‎usecases/ai/edge-ai-demo-studio/workers/speech-to-text/utils.py‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎usecases/ai/edge-ai-demo-studio/workers/text-generation/utils/util.py‎
Lines changed: 1 addition & 0 deletions b/‎usecases/ai/edge-ai-demo-studio/workers/text-generation/utils/util.py‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎usecases/ai/edge-ai-demo-studio/workers/text-to-speech/kokoro/utils.py‎
Lines changed: 1 addition & 0 deletions b/‎usecases/ai/edge-ai-demo-studio/workers/text-to-speech/kokoro/utils.py‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎usecases/ai/visual-text-driven-document-reasoning-engine/.gitignore‎
Lines changed: 31 additions & 0 deletions b/‎usecases/ai/visual-text-driven-document-reasoning-engine/.gitignore‎
Lines changed: 31 additions & 0 deletions
diff --git a/‎usecases/ai/visual-text-driven-document-reasoning-engine/README.md‎
Lines changed: 98 additions & 0 deletions b/‎usecases/ai/visual-text-driven-document-reasoning-engine/README.md‎
Lines changed: 98 additions & 0 deletions
@@ -34,7 +34,7 @@ dependencies = [
     "langchainhub==0.1.21",
     # Document Processing
     "unstructured==0.18.3",
-    "pdfminer.six==20251107",
+    "pypdf>=6.3.0",
     # Database and Modeling
     "sqlmodel>=0.0.24",
 ]
 
@@ -15,7 +15,7 @@
 from langchain_community.document_loaders import (
     CSVLoader,
     EverNoteLoader,
-    PDFMinerLoader,
+    PyPDFLoader,
     TextLoader,
     UnstructuredEPubLoader,
     UnstructuredHTMLLoader,
@@ -45,7 +45,7 @@
     ".html": (UnstructuredHTMLLoader, {}),
     ".md": (UnstructuredMarkdownLoader, {}),
     ".odt": (UnstructuredODTLoader, {}),
-    ".pdf": (PDFMinerLoader, {}),
+    ".pdf": (PyPDFLoader, {}),
     ".ppt": (UnstructuredPowerPointLoader, {}),
     ".pptx": (UnstructuredPowerPointLoader, {}),
     ".txt": (TextLoader, {"encoding": "utf8"}),
 
@@ -51,6 +51,7 @@ def validate_and_sanitize_cache_dir(cache_dir: str) -> str:
         "/tmp",  # Temporary directory
         "/var/cache",  # System cache directory
         "/opt",  # Optional software directory
+        "/mnt",  # Mounted drives
     ]
 
     # Check if the resolved path is within allowed directories
 
@@ -51,6 +51,7 @@ def validate_and_sanitize_cache_dir(cache_dir: str) -> str:
         "/tmp",  # Temporary directory
         "/var/cache",  # System cache directory
         "/opt",  # Optional software directory
+        "/mnt",  # Mounted drives
     ]
 
     # Check if the resolved path is within allowed directories
 
@@ -70,6 +70,7 @@ def validate_and_sanitize_cache_dir(cache_dir: str) -> str:
         "/tmp",  # Temporary directory
         "/var/cache",  # System cache directory
         "/opt",  # Optional software directory
+        "/mnt",  # Mounted drives
     ]
 
     # Check if the resolved path is within allowed directories
 
@@ -51,6 +51,7 @@ def validate_and_sanitize_cache_dir(cache_dir: str) -> str:
         "/tmp",  # Temporary directory
         "/var/cache",  # System cache directory
         "/opt",  # Optional software directory
+        "/mnt",  # Mounted drives
     ]
 
     # Check if the resolved path is within allowed directories
 
@@ -68,6 +68,7 @@ def validate_and_sanitize_cache_dir(cache_dir: str) -> str:
         "/tmp",  # Temporary directory
         "/var/cache",  # System cache directory
         "/opt",  # Optional software directory
+        "/mnt",  # Mounted drives
     ]
 
     # Check if the resolved path is within allowed directories
 
@@ -0,0 +1,31 @@
+# Python virtual environment
+.venv
+
+# PyTorch model files
+*.pt
+
+# Python cache files
+__pycache__/
+
+# Test files and folders
+test/
+test*
+
+# Embeddings folder
+embeddings
+
+# Error logs
+*errors.txt
+
+# VLM models
+models
+
+# VS Code cache
+.vscode
+
+# Config file
+config.py
+
+# History
+history
+history.json
@@ -0,0 +1,98 @@
+<!-- Copyright (C) 2025 Intel Corporation -->
+<!-- SPDX-License-Identifier: Apache-2.0  -->
+# Visual Textual Query-driven Document Reasoning Engine
+
+## Overview
+
+The Visual Textual Query-driven Document Reasoning Engine is an AI-powered tool that combines Vision-Language Models (VLMs) with document retrieval capabilities to enable intelligent, context-aware querying of technical documentation. This engine allows users to ask natural language questions about complex visual and textual content within PDF documents, with support for component identification through image uploads.
+
+![Architecture Diagram](assets/architecture_diagram.png)
+
+### Key Features
+
+- **Multi-modal Document Retrieval**: Indexes PDF documents using advanced vision-language embeddings for semantic search
+- **Component-based Querying**: Upload images of specific components to retrieve relevant documentation pages
+- **Intelligent Visual Understanding**: Automatically identifies components from images and matches them against predefined taxonomies
+- **Agentic Response Generation**: Provides contextual, page-specific answers based on retrieved documentation
+- **Hardware Acceleration**: Optimized for Intel hardware (iGPU/dGPU) using OpenVINO and PyTorch XPU
+- **Interactive Web Interface**: User-friendly Gradio-based UI with query history and visual feedback
+- **Configurable Use Cases**: Easily adaptable to different domains (e.g., robotics manuals, IPC regulations, safety documentation)
+
+### Use Cases
+
+The engine is designed to be domain-agnostic and can be configured for various applications:
+- **Industrial Equipment Manuals**: Query robotic arm operation guides, safety procedures, and maintenance instructions
+- **Electronic Standards Compliance**: Navigate IPC regulations and component specifications
+- **Technical Documentation**: Search through complex visual-heavy manuals with natural language
+- **Training and Support**: Enable field technicians to quickly find relevant information using component photos
+
+
+## Verified Configurations
+The following hardware and OS configurations have been tested and verified:
+
+- **Arrow Lake - H (iGPU)**
+   - Intel(R) Core(TM) Ultra 9 285H
+   - 64 GB RAM
+   - 1 TB storage
+   - Ubuntu 24.04
+   - Python 3.12
+
+- **Arrow Lake - S (dGPU)**
+   - Intel(R) Core(TM) Ultra 9 285
+   - 64 GB RAM
+   - 1 TB storage
+   - Ubuntu 24.04
+   - Python 3.12
+   - Arc A770 (16GB)
+
+## Prerequisites
+Ensure the GPU drivers are installed using the [`gpu_installer.sh`](https://github.com/open-edge-platform/edge-developer-kit-reference-scripts/blob/main/gpu_installer.sh) script.
+
+## Installation
+1. **Install the necessary dependencies.**
+   ```bash
+   apt-get update
+   apt-get install -y python3-venv poppler-utils
+   ```
+
+2. **Create and activate a Python virtual environment:**
+   ```bash
+   python3 -m venv .venv
+   source .venv/bin/activate
+   ```
+
+3. **Install the Python dependencies:**
+   ```bash
+   pip install -r requirements.txt
+   ```
+   
+4. **Then install the PyTorch build with Intel XPU support:**
+   ```bash
+   pip install -U --force-reinstall --no-cache-dir torch torchvision torchaudio --index-url https://download.pytorch.org/whl/xpu   
+   ```
+
+5. **Create the config file:**
+   Create the `config.py` file by copying the content from `config.py.template`, then modify the values to experiment with the tool. A few examples are available in `./assets/usecases`.
+
+## Usage
+1. **Activate the Python virtual environment created earlier (if not activated yet):**
+   ```bash
+   source .venv/bin/activate
+   ```
+
+2. **Run the app using the following command:**
+   - On Arrow Lake systems without a dGPU:
+      ```bash
+      unset ONEAPI_DEVICE_SELECTOR && unset OPENVINO_DEVICE && python main.py
+      ```
+   - On Arrow Lake systems with an A770:
+      - to run fully on dGPU:
+         ```bash
+         ONEAPI_DEVICE_SELECTOR=level_zero:0 OPENVINO_DEVICE=GPU.1 python main.py
+         ```
+      - to run fully on iGPU:
+         ```bash
+         ONEAPI_DEVICE_SELECTOR=level_zero:1 OPENVINO_DEVICE=GPU.0 python main.py
+         ```
+
+Then open the provided local URL in your browser.
Original file line number	Diff line number	Diff line change
`@@ -34,7 +34,7 @@ dependencies = [`
`34`	`34`	`"langchainhub==0.1.21",`
`35`	`35`	`# Document Processing`
`36`	`36`	`"unstructured==0.18.3",`
`37`		`- "pdfminer.six==20251107",`
	`37`	`+ "pypdf>=6.3.0",`
`38`	`38`	`# Database and Modeling`
`39`	`39`	`"sqlmodel>=0.0.24",`
`40`	`40`	`]`
Original file line number	Diff line number	Diff line change
`@@ -51,6 +51,7 @@ def validate_and_sanitize_cache_dir(cache_dir: str) -> str:`
`51`	`51`	`"/tmp", # Temporary directory`
`52`	`52`	`"/var/cache", # System cache directory`
`53`	`53`	`"/opt", # Optional software directory`
	`54`	`+ "/mnt", # Mounted drives`
`54`	`55`	`]`
`55`	`56`
`56`	`57`	`# Check if the resolved path is within allowed directories`
Original file line number	Diff line number	Diff line change
`@@ -70,6 +70,7 @@ def validate_and_sanitize_cache_dir(cache_dir: str) -> str:`
`70`	`70`	`"/tmp", # Temporary directory`
`71`	`71`	`"/var/cache", # System cache directory`
`72`	`72`	`"/opt", # Optional software directory`
	`73`	`+ "/mnt", # Mounted drives`
`73`	`74`	`]`
`74`	`75`
`75`	`76`	`# Check if the resolved path is within allowed directories`
Original file line number	Diff line number	Diff line change
`@@ -68,6 +68,7 @@ def validate_and_sanitize_cache_dir(cache_dir: str) -> str:`
`68`	`68`	`"/tmp", # Temporary directory`
`69`	`69`	`"/var/cache", # System cache directory`
`70`	`70`	`"/opt", # Optional software directory`
	`71`	`+ "/mnt", # Mounted drives`
`71`	`72`	`]`
`72`	`73`
`73`	`74`	`# Check if the resolved path is within allowed directories`