Updated LocalLab v0.2.2

UtkarshTheDev · UtkarshTheDev · commit 1015fe6d828f · 2025-03-01T23:28:21.000+05:30
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -2,6 +2,15 @@
 
 All notable changes for version updates.
 
+## [0.2.2] - 2025-03-03
+
+### Fixed
+
+- Fixed a circular import between core/app.py and routes/system.py by updating system.py to use get_request_count from the logger module directly
+- Made the Flash Attention warning less alarming by changing it from a warning to an info message with a better explanation
+- Enhanced get_system_info endpoint with cleaner code and better organization
+- Fixed potential issues with GPU info retrieval through better error handling
+
 ## [0.2.0] - 2025-03-02
 
 ### Added
diff --git a/locallab/__init__.py b/locallab/__init__.py
@@ -2,7 +2,7 @@
 LocalLab - A lightweight AI inference server
 """
 
-__version__ = "0.2.1" 
+__version__ = "0.2.2" 
 
 from typing import Dict, Any, Optional
 
diff --git a/locallab/model_manager.py b/locallab/model_manager.py
@@ -52,7 +52,7 @@ def __init__(self):
                 import flash_attn
                 logger.info("Flash Attention enabled")
             except ImportError:
-                logger.warning("Flash Attention not available")
+                logger.info("Flash Attention not available - this is optional and won't affect basic functionality")
     
     def _get_quantization_config(self) -> Optional[Dict[str, Any]]:
         """Get quantization configuration based on settings"""
diff --git a/locallab/routes/system.py b/locallab/routes/system.py
@@ -10,7 +10,8 @@
 import torch
 
 from ..logger import get_logger
-from ..core.app import model_manager, request_count, start_time
+from ..logger.logger import get_request_count, get_uptime_seconds
+from ..core.app import model_manager, start_time
 from ..ui.banners import print_system_resources
 from ..config import system_instructions
 
@@ -50,6 +51,24 @@ def get_gpu_memory() -> Optional[Tuple[int, int]]:
         return None
 
 
+def get_gpu_info() -> Optional[Dict[str, Any]]:
+    """Get detailed GPU information including memory and device name"""
+    try:
+        gpu_mem = get_gpu_memory()
+        if gpu_mem:
+            total_gpu, free_gpu = gpu_mem
+            return {
+                "total_memory": total_gpu,
+                "free_memory": free_gpu,
+                "used_memory": total_gpu - free_gpu,
+                "device": torch.cuda.get_device_name(0)
+            }
+        return None
+    except Exception as e:
+        logger.debug(f"Failed to get GPU info: {str(e)}")
+        return None
+
+
 @router.post("/system/instructions")
 async def update_system_instructions(request: SystemInstructionsRequest) -> Dict[str, str]:
     """Update system instructions"""
@@ -84,35 +103,32 @@ async def reset_system_instructions(model_id: Optional[str] = None) -> Dict[str,
 
 
 @router.get("/system/info", response_model=SystemInfoResponse)
-async def system_info() -> SystemInfoResponse:
-    """Get detailed system information"""
+async def get_system_info():
+    """Get system information including CPU, memory, GPU usage, and server stats"""
     try:
-        cpu_usage = psutil.cpu_percent()
+        # Get CPU and memory usage
+        cpu_percent = psutil.cpu_percent()
         memory = psutil.virtual_memory()
-        gpu_info = None
+        memory_percent = memory.percent
         
-        if torch.cuda.is_available():
-            gpu_mem = get_gpu_memory()
-            if gpu_mem:
-                total_gpu, free_gpu = gpu_mem
-                gpu_info = {
-                    "total_memory": total_gpu,
-                    "free_memory": free_gpu,
-                    "used_memory": total_gpu - free_gpu,
-                    "device": torch.cuda.get_device_name(0)
-                }
+        # Get GPU info if available
+        gpu_info = get_gpu_info() if torch.cuda.is_available() else None
         
+        # Get server stats
+        uptime = time.time() - start_time
+        
+        # Return combined info
         return SystemInfoResponse(
-            cpu_usage=cpu_usage,
-            memory_usage=memory.percent,
+            cpu_usage=cpu_percent,
+            memory_usage=memory_percent,
             gpu_info=gpu_info,
             active_model=model_manager.current_model,
-            uptime=time.time() - start_time,
-            request_count=request_count
+            uptime=uptime,
+            request_count=get_request_count()  # Use the function from logger.logger instead
         )
     except Exception as e:
-        logger.error(f"Failed to get system info: {str(e)}")
-        raise HTTPException(status_code=500, detail=str(e))
+        logger.error(f"Error getting system info: {str(e)}")
+        raise HTTPException(status_code=500, detail=f"Error getting system info: {str(e)}")
 
 
 @router.get("/health")
diff --git a/setup.py b/setup.py
@@ -5,7 +5,7 @@
 
 setup(
     name="locallab",
-    version="0.2.1",
+    version="0.2.2",
     packages=find_packages(include=["locallab", "locallab.*"]),
     install_requires=[
         "fastapi>=0.68.0,<1.0.0",