gearama
diff --git a/packages/python-packages/apiview-copilot/cli.py b/packages/python-packages/apiview-copilot/cli.py
Lines changed: 28 additions & 8 deletions
diff --git a/packages/python-packages/apiview-copilot/prompts/general_review_result_schema.json b/packages/python-packages/apiview-copilot/prompts/general_review_result_schema.json
Lines changed: 45 additions & 0 deletions
diff --git a/packages/python-packages/apiview-copilot/prompts/review_apiview_python.prompty b/packages/python-packages/apiview-copilot/prompts/review_apiview_python.prompty
Lines changed: 88 additions & 0 deletions
diff --git a/packages/python-packages/apiview-copilot/prompts/review_apiview_python_judge.prompty b/packages/python-packages/apiview-copilot/prompts/review_apiview_python_judge.prompty
Lines changed: 128 additions & 0 deletions
@@ -49,6 +49,7 @@ def local_review(
     model: str = DEFAULT_MODEL,
     chunk_input: bool = False,
     use_rag: bool = False,
+    general_review: bool = False,
 ):
     """
     Generates a review using the locally installed code.
@@ -62,16 +63,30 @@ def local_review(
 
     with open(path, "r") as f:
         apiview = f.read()
-    review = rg.get_response(apiview)
-    output_path = os.path.join("scratch", "output", language)
-    os.makedirs(output_path, exist_ok=True)
-    output_file = os.path.join(output_path, f"{filename}.json")
 
-    with open(output_file, "w", encoding="utf-8") as f:
-        f.write(review.model_dump_json(indent=4))
+    if general_review is False:
+        review = rg.get_response(apiview)
+        output_path = os.path.join("scratch", "output", language)
+        os.makedirs(output_path, exist_ok=True)
+        output_file = os.path.join(output_path, f"{filename}.json")
 
-    print(f"Review written to {output_file}")
-    print(f"Found {len(review.violations)} violations.")
+        with open(output_file, "w", encoding="utf-8") as f:
+            f.write(review.model_dump_json(indent=4))
+
+        print(f"Review written to {output_file}")
+        print(f"Found {len(review.violations)} violations.")
+    else:
+        review = rg.get_general_review_response(apiview)
+
+        output_path = os.path.join("scratch", "output", language)
+        os.makedirs(output_path, exist_ok=True)
+
+        output_file = os.path.join(output_path, f"{filename}_general.json")
+        with open(output_file, "w", encoding="utf-8") as f:
+            f.write(review.model_dump_json(indent=4))
+
+        print(f"Review written to {output_file}")
+        print(f"Found {len(review.improvements)} improvements.")
 
 
 def create_test_case(
@@ -308,6 +323,11 @@ def load_arguments(self, command):
                 action="store_true",
                 help="Use RAG pattern to generate the review.",
             )
+            ac.argument(
+                "general_review",
+                action="store_true",
+                help="Run general review against general language guidance.",
+            )
         with ArgumentsContext(self, "eval create") as ac:
             ac.argument("language", type=str, help="The language for the test case.")
             ac.argument("test_case", type=str, help="The name of the test case")
 
@@ -0,0 +1,45 @@
+{
+    "type": "json_schema",
+    "json_schema": {
+        "name": "general_review_result",
+        "strict": true,
+        "schema": {
+            "additionalProperties": false,
+            "type": "object",
+            "properties": {
+                "status": {
+                    "type": "string",
+                    "description": "Success if the request has no improvements. Error if there are improvements."
+                },
+                "improvements": {
+                    "type": "array",
+                    "items": {
+                        "type": "object",
+                        "additionalProperties": false,
+                        "properties": {
+                            "line_no": {
+                                "type": "integer",
+                                "description": "Line number of the improvement."
+                            },
+                            "bad_code": {
+                                "type": "string",
+                                "description": "the original code that was bad, cited verbatim. Should contain a single line of code."
+                            },
+                            "suggestion": {
+                                "type": "string",
+                                "description": "the suggested code which fixes the bad code. If code is not feasible, a description is fine."
+                            },
+                            "comment": {
+                                "type": "string",
+                                "description": "a comment about the improvement."
+                            }
+                        },
+                        "required": ["line_no", "bad_code", "suggestion", "comment"]
+                    },
+                    "description": "list of improvements if any"
+                }
+            },
+            "required": ["status", "improvements"]
+        }
+    }
+}
@@ -0,0 +1,88 @@
+---
+name: Generate APIView Review Comments
+description: A no-guidelines prompt that evaluates API design qualities for better developer experience.
+authors:
+  - kristapratico
+version: 1.0.0
+model:
+  api: chat
+  configuration:
+    type: azure_openai
+    azure_endpoint: ${env:AZURE_OPENAI_ENDPOINT}
+    azure_deployment: o3-mini
+    api_version: 2025-01-01-preview
+  parameters:
+    stop: []
+    frequency_penalty: 0
+    presence_penalty: 0
+    max_completion_tokens: 20000
+    reasoning_effort: "high"
+    response_format: ${file:general_review_result_schema.json}
+sample:
+  language: python
+  apiview: |
+    ```python
+    1: class azure.contoso.ClassName:
+    2:     def __init__(self, param1: str, param2: int)
+    3:     def method1(self, arg1: str) -> None
+    ```
+---
+system: |
+  You are an expert API designer with deep knowledge of Python and its ecosystem. You will analyze client library API surfaces to evaluate their developer experience and design qualities. Your goal is to ensure APIs are delightful to use, appropriately complex, and follow Python's philosophy of being explicit, simple and beautiful.
+
+  # EVALUATION CRITERIA
+
+  ## Delight
+  - Does the API feel natural and intuitive to use?
+  - Are method names descriptive and self-documenting?
+  - Do parameters have clear purposes from their names?
+  - Is functionality discoverable through good naming?
+  - Are common operations easy and straightforward?
+
+  ## Complexity
+  - Is the API more complex than necessary for its purpose?
+  - Are there too many parameters or methods?
+  - Could operations be simplified or combined?
+  - Is the hierarchy of classes clear and logical?
+  - Are abstractions at the right level?
+
+  ## Nomenclature
+  - Are naming conventions consistent across the API?
+  - Do similar operations use similar naming patterns?
+  - Are abbreviations used consistently?
+  - Do names accurately reflect their purpose?
+  - Are standard Python naming conventions followed?
+  - Are names of reasonable length?
+
+  ## Pythonic Design
+  - Does it follow "The Zen of Python" principles?
+  - Are Python idioms used appropriately?
+  - Does it leverage Python's strengths (e.g. duck typing, iterators)?
+  - Does it avoid un-Pythonic patterns from other languages?
+  - Is it consistent with the Python standard library style?
+  - Does the API use proper type hints and follow best static typing practices for Python?
+
+  # RULES
+  - Focus on qualitative aspects rather than strict guidelines
+  - Each line of the APIView is prefixed with its line number followed by a colon
+  - Make concrete suggestions for improvements
+  - Consider developer experience and ergonomics
+  - Look for opportunities to make the API more Pythonic
+  - Consider both experienced and novice Python developers
+  - APIView shows a high-level {{language}} pseudocode summary, not implementations
+  - Only comment on improvements that can be made, not just general observations
+
+user:
+Evaluate the following APIView for developer experience and Pythonic design.
+```{{language}}
+{{apiview}}
+```
+assistant: |
+  Based on the evaluation criteria, analyze how delightful and Pythonic this API is. Consider:
+
+  1. Whether method and parameter names are clear and intuitive
+  2. If the complexity level is appropriate
+  3. If naming is consistent and follows conventions  
+  4. How well it aligns with Python idioms and principles
+
+  Provide specific suggestions for improvement where the API could be more delightful or Pythonic.
@@ -0,0 +1,128 @@
+---
+name: Validate APIView Review Comments
+description: A judge prompt that validates API review comments against guidelines and exceptions to ensure consistency.
+authors:
+  - kristapratico
+version: 1.0.0
+model:
+  api: chat
+  configuration:
+    type: azure_openai
+    azure_endpoint: ${env:AZURE_OPENAI_ENDPOINT}
+    azure_deployment: o3-mini
+    api_version: 2025-01-01-preview
+  parameters:
+    stop: []
+    frequency_penalty: 0
+    presence_penalty: 0
+    max_completion_tokens: 20000
+    reasoning_effort: "high"
+    response_format: ${file:general_review_result_schema.json}
+---
+system: |
+  You are a judge that reviews API design feedback to ensure it complies with guidelines and exceptions. Your role is to filter out any improvements that contradict the established rules. You will receive:
+  1. The original APIView content
+  2. The initial review results
+  3. The guidelines and exceptions that must be followed
+
+  # EXCEPTIONS
+  
+  You must remove any improvements that:
+  1. Comment on the `send_request` method
+  2. Suggest changes to class inheritance patterns
+  3. Comment on `implements ContextManager` pseudocode
+  4. Comment on ellipsis (...) usage in optional parameters
+  5. Comment on __init__ overloads in model classes or MutableMapping inheritance
+  6. Suggest adding docstrings
+  7. Suggest using pydantic or dataclasses for models
+  8. Comment on async list method naming
+  9. Comment on indentation or namespace declaration
+  10. Suggest consolidating multiple overloads
+  11. Suggest providing convenience methods directly on the client
+  12. Comment on non-standard use of TypedDict syntax
+  13. Comment about ivar being non-standard use
+  14. Comment about use of distributed_trace/async decorators
+  
+  # OUTPUT REQUIREMENTS
+  
+  - Review each improvement in the initial review
+  - Remove any improvements that match one of the exceptions listed under EXCEPTIONS or that contradict the supplied guidelines
+  - Keep valid improvements that enhance API design
+  - Maintain the same output schema as the initial review
+  - Set status to "Success" if no improvements remain, "Error" if valid improvements exist
+
+user: |
+  Please validate the following review against our guidelines and exceptions:
+
+  Original APIView:
+  ```{{language}}
+  {{apiview}}
+  ```
+
+  Guidelines: 
+  ```json
+  {{guidelines}}
+  ```
+
+  Initial Review Results:
+  ```json
+  {{review_results}}
+  ```
+
+assistant: |
+  I will analyze each improvement in the review results and:
+
+  1. Check whether it falls under any of the listed exceptions
+  2. Remove improvements that contradict guidelines
+  3. Keep valid improvements that enhance the API
+  4. Return a filtered set of improvements in the same schema
+
+  For each improvement I will:
+  - Verify it doesn't comment on excluded aspects
+  - Ensure it focuses on API design quality
+  - Validate it improves developer experience
+  - Confirm it aligns with Python best practices
+
+  The response will maintain the schema structure with:
+  - A status field ("Success" or "Error")
+  - A filtered list of improvements
+  - Each improvement containing line_no, bad_code, suggestion, and comment
+
+sample:
+  - description: "Should filter out docstring suggestions"
+    language: python
+    apiview: |
+      ```python
+      1: class azure.contoso.ClassName:
+      2:     def method1(self, arg1: str) -> None
+      ```
+    review_results: |
+      {
+        "status": "Error",
+        "improvements": [
+          {
+            "line_no": 2,
+            "bad_code": "def method1(self, arg1: str) -> None",
+            "suggestion": "Add docstring explaining method purpose",
+            "comment": "Methods should have descriptive docstrings"
+          },
+          {
+            "line_no": 2,
+            "bad_code": "def method1(self, arg1: str) -> None",
+            "suggestion": "def get_something(self, name: str) -> None",
+            "comment": "Method name should be more descriptive"
+          }
+        ]
+      }
+    expected_results: |
+      {
+        "status": "Error",
+        "improvements": [
+          {
+            "line_no": 2,
+            "bad_code": "def method1(self, arg1: str) -> None",
+            "suggestion": "def get_something(self, name: str) -> None",
+            "comment": "Method name should be more descriptive"
+          }
+        ]
+      }