
Commit 8affd09

haasonsaas and claude committed
Major feature additions: Record/Replay, Cost Tracking, Error Mocking
Implemented critical missing features:
- Full record/replay functionality for API interactions
- Cost tracking showing money saved by using mocks
- Error-scenario mocking (rate limits, auth errors, timeouts)
- Docker support for easy deployment
- Integration tests for end-to-end validation
- Request/response persistence system
- Enhanced server with multiple modes

New components:
- recorder.py: records and replays API interactions
- cost_tracker.py: tracks API cost savings with detailed reports
- Error mocking in the core rules system
- Docker/docker-compose configuration
- Comprehensive integration tests

This brings Mocktopus much closer to production readiness, with key features needed for real-world usage.

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <[email protected]>
1 parent 3c96a23 commit 8affd09
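The cost-tracking idea — recording what each mocked call *would* have cost against the real API — can be sketched in a few lines. The diff for `cost_tracker.py` is not shown on this page, so the class name, method, and per-token prices below are illustrative assumptions, not the commit's actual values.

```python
# Hypothetical sketch of the arithmetic a tracker like cost_tracker.py
# might do; model names and USD prices are illustrative assumptions.
from dataclasses import dataclass
from typing import Dict, Tuple

# Assumed USD prices per 1K tokens: (input, output)
PRICES: Dict[str, Tuple[float, float]] = {
    "gpt-4": (0.03, 0.06),
    "gpt-3.5-turbo": (0.0005, 0.0015),
}

@dataclass
class CostTracker:
    saved_usd: float = 0.0
    calls: int = 0

    def record(self, model: str, input_tokens: int, output_tokens: int) -> float:
        """Record one mocked call and return what the real API would have cost."""
        in_price, out_price = PRICES.get(model, (0.0, 0.0))
        cost = input_tokens / 1000 * in_price + output_tokens / 1000 * out_price
        self.saved_usd += cost
        self.calls += 1
        return cost

tracker = CostTracker()
tracker.record("gpt-4", input_tokens=1000, output_tokens=500)
print(f"{tracker.calls} mocked call(s), ${tracker.saved_usd:.2f} saved")
```

Summed over a CI run's worth of mocked requests, this is the "money saved" figure the commit message refers to.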

File tree

11 files changed: +1479 −17 lines


Dockerfile

Lines changed: 50 additions & 0 deletions
```dockerfile
# Multi-stage build for smaller image
FROM python:3.11-slim AS builder

WORKDIR /app

# Install build dependencies
RUN apt-get update && apt-get install -y \
    gcc \
    && rm -rf /var/lib/apt/lists/*

# Copy requirements
COPY pyproject.toml ./
COPY src/ ./src/

# Install package
RUN pip install --no-cache-dir -e .

# Runtime stage
FROM python:3.11-slim

WORKDIR /app

# Copy installed package from builder
COPY --from=builder /usr/local/lib/python3.11/site-packages /usr/local/lib/python3.11/site-packages
COPY --from=builder /usr/local/bin/mocktopus /usr/local/bin/mocktopus

# Copy source code (for editable install)
COPY src/ ./src/
COPY pyproject.toml ./
COPY examples/ ./examples/

# Create directories for recordings and scenarios
RUN mkdir -p /data/recordings /data/scenarios

# Install runtime package
RUN pip install --no-cache-dir -e .

# Expose default port
EXPOSE 8080

# Health check
HEALTHCHECK --interval=30s --timeout=3s --start-period=5s --retries=3 \
    CMD python -c "import urllib.request; urllib.request.urlopen('http://localhost:8080/health')" || exit 1

# Default scenario location
ENV SCENARIO_PATH=/data/scenarios/scenario.yaml
ENV RECORDINGS_DIR=/data/recordings

# Run server by default. Shell form is required here so ${SCENARIO_PATH}
# is expanded: the exec form ["mocktopus", "serve", "-s", "${SCENARIO_PATH}", ...]
# would pass the literal string "${SCENARIO_PATH}" without substitution.
CMD mocktopus serve -s ${SCENARIO_PATH} --host 0.0.0.0
```
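The `HEALTHCHECK` above probes a `/health` endpoint with a one-liner `urllib` call. The probe logic can be exercised standalone against a stand-in server; the handler below is an assumption for illustration, not Mocktopus's actual `/health` implementation.

```python
# Sketch of the Dockerfile's HEALTHCHECK probe, run against a minimal
# stand-in /health endpoint; the real server's handler may differ.
import threading
import urllib.request
from http.server import BaseHTTPRequestHandler, HTTPServer

class HealthHandler(BaseHTTPRequestHandler):
    def do_GET(self):
        if self.path == "/health":
            self.send_response(200)
            self.end_headers()
            self.wfile.write(b"ok")
        else:
            self.send_response(404)
            self.end_headers()

    def log_message(self, *args):  # keep output quiet
        pass

server = HTTPServer(("127.0.0.1", 0), HealthHandler)  # port 0 = any free port
threading.Thread(target=server.serve_forever, daemon=True).start()

url = f"http://127.0.0.1:{server.server_port}/health"
status = urllib.request.urlopen(url).status  # same call the HEALTHCHECK makes
print("health status:", status)
server.shutdown()
```

A non-2xx status (or a connection error) makes `urlopen` raise, so the `|| exit 1` in the Dockerfile marks the container unhealthy.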

ROADMAP.md

Lines changed: 146 additions & 0 deletions
```markdown
# 🗺️ Mocktopus Roadmap

## Current State (v0.1.0)
✅ Basic HTTP server mimicking OpenAI/Anthropic APIs
✅ YAML-based scenarios with pattern matching
✅ Streaming support (SSE)
✅ Tool/function calling
✅ CLI with serve, validate, simulate commands

## Phase 1: Core Features (v0.2.0) - Q1 2024
### Record & Replay
- [ ] Implement request proxy to real APIs
- [ ] Store interactions in SQLite/JSON
- [ ] Intelligent replay matching
- [ ] Sensitive data filtering
- [ ] Compression for stored data

### Additional APIs
- [ ] Embeddings API (/v1/embeddings)
- [ ] Legacy Completions API (/v1/completions)
- [ ] Models endpoint with proper data
- [ ] Error response mocking

### Testing Improvements
- [ ] Integration tests with OpenAI SDK
- [ ] Integration tests with Anthropic SDK
- [ ] Performance benchmarks
- [ ] Load testing capabilities

## Phase 2: Intelligence (v0.3.0) - Q2 2024
### Semantic Matching
- [ ] Vector similarity matching using embeddings
- [ ] Fuzzy matching with configurable thresholds
- [ ] Intent-based routing
- [ ] Context-aware responses

### Stateful Conversations
- [ ] Conversation state tracking
- [ ] Multi-turn dialogue support
- [ ] Variable extraction and storage
- [ ] Conditional response logic

### Response Templating
- [ ] Jinja2-style templates
- [ ] Dynamic variable injection
- [ ] Helper functions (uuid, timestamp, random)
- [ ] Request data access in templates

## Phase 3: Developer Experience (v0.4.0) - Q2 2024
### Web Dashboard
- [ ] Real-time request inspector
- [ ] Visual scenario builder
- [ ] Mock rule debugger
- [ ] Performance metrics dashboard
- [ ] Cost tracking visualization

### SDK Integrations
- [ ] LangChain integration & examples
- [ ] LlamaIndex integration & examples
- [ ] Vercel AI SDK examples
- [ ] Haystack integration
- [ ] AutoGen examples

### Deployment
- [ ] Docker image with multi-arch support
- [ ] Kubernetes Helm chart
- [ ] GitHub Action for CI integration
- [ ] Cloud Run button
- [ ] Railway/Render templates

## Phase 4: Advanced Features (v0.5.0) - Q3 2024
### Assistants API
- [ ] Full Assistants API support
- [ ] Thread management
- [ ] File handling
- [ ] Code interpreter mocking
- [ ] Function calling in assistants

### Vision & Audio
- [ ] Image input support
- [ ] Vision API mocking
- [ ] Audio transcription mocking
- [ ] TTS mocking

### Chaos Engineering
- [ ] Random failure injection
- [ ] Latency simulation
- [ ] Partial failures
- [ ] Network issues simulation
- [ ] Rate limit simulation

## Phase 5: Enterprise (v1.0.0) - Q4 2024
### Security & Compliance
- [ ] Authentication (API keys, JWT)
- [ ] Request filtering/whitelisting
- [ ] Audit logging
- [ ] PII detection and masking
- [ ] Compliance reporting

### Scalability
- [ ] Distributed mode with Redis
- [ ] Horizontal scaling support
- [ ] Connection pooling
- [ ] Cache layer
- [ ] Performance optimizations

### Observability
- [ ] Prometheus metrics
- [ ] OpenTelemetry support
- [ ] Detailed logging
- [ ] Health check endpoints
- [ ] Performance profiling

## Future Ideas (v2.0+)
- **WebSocket Support**: Real-time streaming applications
- **GraphQL Mocking**: For GraphQL-based LLM APIs
- **Plugin Marketplace**: Community-contributed plugins
- **Cloud Service**: Hosted Mocktopus SaaS
- **Test Generation**: Auto-generate test scenarios from production logs
- **Smart Fuzzing**: Automatic edge case discovery
- **Multi-Language SDKs**: Go, Rust, Java, Ruby clients
- **OpenAPI Generator**: Generate mocks from OpenAPI specs
- **Behavior Learning**: Learn patterns from real API usage
- **Cost Optimization**: Suggest cheaper model alternatives

## Contributing
Want to help? Check our [CONTRIBUTING.md](CONTRIBUTING.md) for:
- 🐛 Bug fixes
- ✨ Feature implementations
- 📚 Documentation improvements
- 🧪 Test coverage
- 🎨 UI/UX improvements

## Metrics for Success
- **Adoption**: 1000+ GitHub stars
- **Usage**: 100+ companies using in CI/CD
- **Performance**: <10ms response time for mocks
- **Coverage**: 100% OpenAI API compatibility
- **Reliability**: 99.9% uptime for hosted version
- **Cost Savings**: $1M+ saved by users annually

## Get Involved
- 💬 [Discord Community](https://discord.gg/mocktopus)
- 🐦 [Twitter Updates](https://twitter.com/mocktopus)
- 📧 [Newsletter](https://mocktopus.dev/newsletter)
- 🎥 [YouTube Tutorials](https://youtube.com/@mocktopus)
```

docker-compose.yml

Lines changed: 53 additions & 0 deletions
```yaml
version: '3.8'

services:
  mocktopus:
    build: .
    image: mocktopus:latest
    container_name: mocktopus
    ports:
      - "8080:8080"
    volumes:
      # Mount scenarios directory
      - ./examples:/data/scenarios:ro
      # Mount recordings directory for record/replay
      - ./recordings:/data/recordings
    environment:
      # Default to mock mode
      - MODE=mock
      # Use chat-basic.yaml as default scenario
      - SCENARIO_PATH=/data/scenarios/chat-basic.yaml
      # Optional: Set API keys for record mode
      # - OPENAI_API_KEY=your-key-here
      # - ANTHROPIC_API_KEY=your-key-here
    # Note: ${...} in `command:` is interpolated from the *host* shell
    # environment, not from the `environment:` block above, so defaults
    # are supplied inline.
    command: >
      mocktopus serve
      -s ${SCENARIO_PATH:-/data/scenarios/chat-basic.yaml}
      --mode ${MODE:-mock}
      --recordings-dir /data/recordings
      --host 0.0.0.0
      -v
    restart: unless-stopped
    networks:
      - mocktopus-net

  # Optional: Add a test client service
  test-client:
    image: python:3.11-slim
    container_name: mocktopus-test
    depends_on:
      - mocktopus
    volumes:
      - ./tests:/tests
    environment:
      - MOCKTOPUS_URL=http://mocktopus:8080
    command: sleep infinity
    networks:
      - mocktopus-net

networks:
  mocktopus-net:
    driver: bridge

# Declared for future use; the service currently bind-mounts ./recordings
volumes:
  recordings:
```

examples/errors.yaml

Lines changed: 84 additions & 0 deletions
```yaml
version: 1
meta:
  description: Error scenario examples for testing error handling
  author: Mocktopus

rules:
  # Rate limit error
  - type: llm.openai
    when:
      messages_contains: "rate limit test"
    error:
      error_type: "rate_limit"
      message: "Rate limit exceeded. Please retry after some time."
      status_code: 429
      retry_after: 60
      delay_ms: 100

  # Authentication error
  - type: llm.openai
    when:
      messages_contains: "auth test"
    error:
      error_type: "authentication"
      message: "Invalid API key provided"
      status_code: 401

  # Invalid request error
  - type: llm.openai
    when:
      messages_contains: "invalid request"
    error:
      error_type: "invalid_request"
      message: "The model 'gpt-5' does not exist"
      status_code: 400

  # Timeout simulation
  - type: llm.openai
    when:
      messages_contains: "timeout test"
    error:
      error_type: "timeout"
      message: "Request timed out after 30 seconds"
      status_code: 504
      delay_ms: 5000  # Wait 5 seconds, then return the timeout error

  # Server error
  - type: llm.openai
    when:
      messages_contains: "server error"
    error:
      error_type: "server_error"
      message: "Internal server error occurred"
      status_code: 500

  # Intermittent error (fails 2 times, then works)
  - type: llm.openai
    when:
      messages_contains: "retry test"
    times: 2
    error:
      error_type: "server_error"
      message: "Temporary server issue"
      status_code: 503

  # After the error rule is exhausted, this rule handles success
  - type: llm.openai
    when:
      messages_contains: "retry test"
    respond:
      content: "Success after retries!"
      usage:
        input_tokens: 10
        output_tokens: 5

  # Custom error
  - type: llm.openai
    when:
      messages_contains: "custom error"
    error:
      error_type: "content_filter"
      message: "Content was blocked by safety filters"
      code: "content_filtered"
      status_code: 422
      delay_ms: 200
```
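The "retry test" pair above depends on rules with a `times` budget being skipped once exhausted, so the error rule shadows the success rule for exactly two calls. That selection logic can be sketched standalone; the `MockRule` structure below is illustrative, not Mocktopus's actual API.

```python
# Sketch of how a `times`-limited error rule shadows a later success rule
# until its budget is spent; rule shape is illustrative, not the real API.
from dataclasses import dataclass
from typing import Optional

@dataclass
class MockRule:
    contains: str
    payload: dict
    times: Optional[int] = None  # None => unlimited uses

    def take(self) -> bool:
        """Consume one use; return False once the budget is spent."""
        if self.times is None:
            return True
        if self.times <= 0:
            return False
        self.times -= 1
        return True

rules = [
    MockRule("retry test", {"error": "server_error", "status": 503}, times=2),
    MockRule("retry test", {"content": "Success after retries!"}),
]

def respond(message: str) -> dict:
    # First matching rule with remaining budget wins, as in errors.yaml
    for rule in rules:
        if rule.contains in message and rule.take():
            return rule.payload
    return {"error": "no_match", "status": 404}

results = [respond("please run the retry test") for _ in range(3)]
# First two calls hit the 503 rule; the third falls through to success
```

This ordering — limited error rule first, unlimited success rule second — is what lets a client's retry logic be tested end to end.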

pyproject.toml

Lines changed: 7 additions & 0 deletions
```diff
@@ -30,5 +30,12 @@ packages = ["src/mocktopus"]
 line-length = 100
 target-version = "py39"

+[project.optional-dependencies]
+test = [
+    "pytest>=7.0",
+    "pytest-asyncio>=0.21",
+]
+
 [tool.pytest.ini_options]
 addopts = "-q"
+asyncio_mode = "auto"
```

src/mocktopus/core.py

Lines changed: 5 additions & 1 deletion
```diff
@@ -16,6 +16,7 @@ class Rule:
     when: Dict[str, Any]
     respond: Dict[str, Any]
     times: Optional[int] = None  # None => unlimited
+    error: Optional[Dict[str, Any]] = None  # Error response config
     _remaining: Optional[int] = field(default=None, init=False, repr=False)

     def ok_to_use(self) -> bool:
@@ -101,7 +102,9 @@ def _llm_rule_matches(self, rule: Rule, *, model: str, messages: List[Dict[str,
     def find_llm(self, *, model: str, messages: List[Dict[str, Any]]) -> Tuple[Optional[Rule], Optional[Dict[str, Any]]]:
         for rule in self.rules:
             if self._llm_rule_matches(rule, model=model, messages=messages):
-                return rule, rule.respond
+                # Return error config if present, otherwise normal response
+                response_config = rule.error if rule.error else rule.respond
+                return rule, response_config
         return None, None

 # --- YAML I/O ---------------------------------------------------------
@@ -122,6 +125,7 @@ def from_yaml(cls, path: str) -> "Scenario":
                 when=r.get("when", {}) or {},
                 respond=r.get("respond", {}) or {},
                 times=r.get("times"),
+                error=r.get("error"),
             )
         )
     meta = data.get("meta", {})
```
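The behavior of the new branch — an `error` config taking precedence over `respond` on a matching rule — can be shown in isolation. The stand-in below reduces matching to a substring check over message contents; the real class in `src/mocktopus/core.py` has more fields and richer matching.

```python
# Simplified stand-in for the patched Rule/find_llm logic: a rule that
# carries an `error` config wins over its `respond` config. Matching is
# reduced to a substring check for this sketch.
from dataclasses import dataclass
from typing import Any, Dict, List, Optional, Tuple

@dataclass
class Rule:
    when: Dict[str, Any]
    respond: Dict[str, Any]
    error: Optional[Dict[str, Any]] = None

def find_llm(
    rules: List[Rule], messages: List[Dict[str, Any]]
) -> Tuple[Optional[Rule], Optional[Dict[str, Any]]]:
    text = " ".join(m.get("content", "") for m in messages)
    for rule in rules:
        if rule.when.get("messages_contains", "") in text:
            # Error config, if present, takes precedence over the response
            return rule, rule.error if rule.error else rule.respond
    return None, None

rules = [
    Rule(when={"messages_contains": "auth test"},
         respond={},
         error={"error_type": "authentication", "status_code": 401}),
    Rule(when={"messages_contains": "hello"},
         respond={"content": "Hi there!"}),
]

_, config = find_llm(rules, [{"role": "user", "content": "auth test please"}])
print(config)  # the 401 error config, not the empty respond dict
```

The server can then branch on which kind of config it received: a `respond` dict becomes a normal completion, an `error` dict becomes an HTTP error with the given `status_code`.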
