@@ -138,3 +138,150 @@ jobs:
           else
             echo "Quick benchmark not found, skipping"
           fi
+
+  # Real API benchmark - only runs when API keys are available
+  # Triggered manually or on main branch with secrets
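+  # Note: the check_keys step below lets the job skip the API steps gracefully when no key is configured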
+  real-api-benchmark:
+    runs-on: ubuntu-latest
+    timeout-minutes: 15
+    if: github.event_name == 'workflow_dispatch' || (github.ref == 'refs/heads/main' && github.event_name == 'push')
+
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: '3.11'
+          cache: 'pip'
+
+      - name: Install package
+        run: |
+          pip install -e .
+          pip install pytest
+
+      - name: Check API Key Availability
+        id: check_keys
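+        # writes has_openai to $GITHUB_OUTPUT so later steps can gate on steps.check_keys.outputs.has_openai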
+        run: |
+          if [ -n "${{ secrets.OPENAI_API_KEY }}" ]; then
+            echo "has_openai=true" >> $GITHUB_OUTPUT
+            echo "✅ OpenAI API key available"
+          else
+            echo "has_openai=false" >> $GITHUB_OUTPUT
+            echo "⚠️ OpenAI API key not available, skipping real API tests"
+          fi
+
+      - name: Run Real API Benchmark
+        if: steps.check_keys.outputs.has_openai == 'true'
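+        # secrets are only visible to the script through this explicit env mapping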
+        env:
+          OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
+        run: |
+          python -c "
+          import os
+          import sys
+          import time
+
+          # Verify API key is set
+          if not os.environ.get('OPENAI_API_KEY'):
+              print('❌ OPENAI_API_KEY not set')
+              sys.exit(1)
+
+          from praisonaiagents import Agent
+
+          # Create a simple agent
+          agent = Agent(
+              name='BenchmarkAgent',
+              instructions='You are a helpful assistant. Be concise.',
+              llm='gpt-4o-mini',
+              output='silent'
+          )
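+          # output='silent' is assumed here to suppress console rendering so timings measure only the API round trip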
+
+          # Warmup run
+          print('Running warmup...')
+          agent.chat('Say hello in one word')
+
+          # Benchmark runs
+          print('Running benchmark (3 iterations)...')
+          times = []
+          for i in range(3):
+              start = time.perf_counter()
+              response = agent.chat('What is 2+2? Answer with just the number.')
+              elapsed = time.perf_counter() - start
+              times.append(elapsed)
+              print(f'  Run {i+1}: {elapsed:.2f}s')
+
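+          # Note: three iterations only give a rough signal; real API latency varies considerably between calls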
+          avg = sum(times) / len(times)
+          print()
+          print('Real API Benchmark Results:')
+          print(f'  Average response time: {avg:.2f}s')
+          print(f'  Min: {min(times):.2f}s')
+          print(f'  Max: {max(times):.2f}s')
+
+          # Verify response quality
+          if '4' in response:
+              print('✅ Response quality check passed')
+          else:
+              print(f'⚠️ Unexpected response: {response}')
+          "
+
+      - name: Run Multi-Agent Benchmark
+        if: steps.check_keys.outputs.has_openai == 'true'
+        env:
+          OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
+        run: |
+          python -c "
+          import time
+          import os
+
+          from praisonaiagents import Agent, Agents, Task
+
+          # Create agents
+          researcher = Agent(
+              name='Researcher',
+              instructions='You research topics. Be brief.',
+              llm='gpt-4o-mini',
+              output='silent'
+          )
+
+          writer = Agent(
+              name='Writer',
+              instructions='You write summaries. Be brief.',
+              llm='gpt-4o-mini',
+              output='silent'
+          )
+
+          # Create tasks
+          task1 = Task(
+              description='List 2 facts about Python programming',
+              agent=researcher,
+              expected_output='2 brief facts'
+          )
+
+          task2 = Task(
+              description='Summarize the facts in one sentence',
+              agent=writer,
+              expected_output='One sentence summary'
+          )
+
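+          # Assumption: Agents runs the tasks in listed order (researcher, then writer), so the timing below covers both calls end to end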
+          # Run workflow
+          print('Running multi-agent workflow...')
+          start = time.perf_counter()
+
+          agents = Agents(agents=[researcher, writer], tasks=[task1, task2])
+          result = agents.start()
+
+          elapsed = time.perf_counter() - start
+
+          print()
+          print('Multi-Agent Benchmark Results:')
+          print(f'  Total workflow time: {elapsed:.2f}s')
+          print('  Agents: 2')
+          print('  Tasks: 2')
+          print('✅ Multi-agent workflow completed successfully')
+          "
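
Since the job is gated on workflow_dispatch, it can also be triggered by hand once the workflow is merged. A minimal sketch using the GitHub CLI; the file name benchmark.yml is a placeholder for whatever this workflow is actually saved as under .github/workflows:

    # kick off the benchmark job against main
    gh workflow run benchmark.yml --ref main

    # follow the resulting run from the terminal
    gh run watch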