Skip to content

Commit b2b16a4

Browse files
committed: ✨ Now chunk preview supports pagination
1 parent 02e7b2f commit b2b16a4

File tree

11 files changed

+564
-180
lines changed

11 files changed

+564
-180
lines changed

backend/apps/vectordatabase_app.py

Lines changed: 13 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -202,14 +202,23 @@ def health_check(vdb_core: VectorDatabaseCore = Depends(get_vector_db_core)):
202202
def get_index_chunks(
203203
index_name: str = Path(...,
204204
description="Name of the index to get chunks from"),
205-
batch_size: int = Query(
206-
1000, description="Number of records to fetch per request"),
205+
page: int = Query(
206+
None, description="Page number (1-based) for pagination"),
207+
page_size: int = Query(
208+
None, description="Number of records per page for pagination"),
209+
path_or_url: Optional[str] = Query(
210+
None, description="Filter chunks by document path_or_url"),
207211
vdb_core: VectorDatabaseCore = Depends(get_vector_db_core)
208212
):
209-
"""Get all chunks from the specified index"""
213+
"""Get chunks from the specified index, with optional pagination support"""
210214
try:
211215
result = ElasticSearchService.get_index_chunks(
212-
index_name, batch_size, vdb_core)
216+
index_name=index_name,
217+
page=page,
218+
page_size=page_size,
219+
path_or_url=path_or_url,
220+
vdb_core=vdb_core,
221+
)
213222
return JSONResponse(status_code=HTTPStatus.OK, content=result)
214223
except Exception as e:
215224
error_msg = str(e)

backend/services/vectordatabase_service.py

Lines changed: 31 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -575,7 +575,8 @@ async def list_files(
575575
'file_size': file_info.get('file_size', 0),
576576
'create_time': int(utc_create_timestamp * 1000),
577577
'status': "COMPLETED",
578-
'latest_task_id': ''
578+
'latest_task_id': '',
579+
'chunk_count': file_info.get('chunk_count', 0)
579580
}
580581
files.append(file_data)
581582

@@ -633,7 +634,7 @@ async def list_files(
633634
# Initialize chunks for all files
634635
for file_data in files:
635636
file_data['chunks'] = []
636-
file_data['chunk_count'] = 0
637+
file_data['chunk_count'] = file_data.get('chunk_count', 0)
637638

638639
if msearch_body:
639640
try:
@@ -670,7 +671,7 @@ async def list_files(
670671
else:
671672
for file_data in files:
672673
file_data['chunks'] = []
673-
file_data['chunk_count'] = 0
674+
file_data['chunk_count'] = file_data.get('chunk_count', 0)
674675

675676
return {"files": files}
676677

@@ -925,27 +926,39 @@ def get_summary(index_name: str = Path(..., description="Name of the index to ge
925926

926927
@staticmethod
927928
def get_index_chunks(
928-
index_name: str = Path(...,
929-
description="Name of the index to get chunks from"),
930-
batch_size: int = Query(
931-
1000, description="Number of records to fetch per request"),
932-
vdb_core: VectorDatabaseCore = Depends(get_vector_db_core)
929+
index_name: str,
930+
page: Optional[int] = None,
931+
page_size: Optional[int] = None,
932+
path_or_url: Optional[str] = None,
933+
vdb_core: VectorDatabaseCore = Depends(get_vector_db_core),
933934
):
934935
"""
935-
Retrieve all chunk records for the specified index.
936+
Retrieve chunk records for the specified index with optional pagination.
936937
937938
Args:
938939
index_name: Name of the index to query
939-
batch_size: Number of records to fetch per request
940+
page: Page number (1-based) when paginating
941+
page_size: Page size when paginating
942+
path_or_url: Optional document filter
940943
vdb_core: VectorDatabaseCore instance
941944
942945
Returns:
943-
Dictionary containing status and list of chunks
946+
Dictionary containing status, chunk list, total, and pagination metadata
944947
"""
945948
try:
946-
chunks = vdb_core.get_index_chunks(index_name, batch_size)
947-
filtered_chunks = []
948-
for chunk in chunks:
949+
result = vdb_core.get_index_chunks(
950+
index_name,
951+
page=page,
952+
page_size=page_size,
953+
path_or_url=path_or_url,
954+
)
955+
raw_chunks = result.get("chunks", [])
956+
total = result.get("total", len(raw_chunks))
957+
result_page = result.get("page", page)
958+
result_page_size = result.get("page_size", page_size)
959+
960+
filtered_chunks: List[Any] = []
961+
for chunk in raw_chunks:
949962
if isinstance(chunk, dict):
950963
filtered_chunks.append(
951964
{
@@ -956,11 +969,14 @@ def get_index_chunks(
956969
)
957970
else:
958971
filtered_chunks.append(chunk)
972+
959973
return {
960974
"status": "success",
961975
"message": f"Successfully retrieved {len(filtered_chunks)} chunks from index {index_name}",
962976
"chunks": filtered_chunks,
963-
"total": len(filtered_chunks)
977+
"total": total,
978+
"page": result_page,
979+
"page_size": result_page_size
964980
}
965981
except Exception as e:
966982
error_msg = f"Error retrieving chunks from index {index_name}: {str(e)}"

0 commit comments

Comments (0)