You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Add support for Built-in Tools for the Tool Call Accuracy Evaluator (#42359)
* support 5 levels, evaluate all tools at once
* Update sample notebook and change log
* Add missing import
* Modify test cases to match the new output format
* Modify other test file to match the new output format
* Fixed parsing of results
* Change key name in output
* Spell check fixes
* Minor prompt update
* Update result key to tool_call_accuracy
* Delete test_new_evaluator.ipynb
* Added field names and messages as constants
* Additional note in prompt
* Re-add the temperature to the prompty file
* Removed 'applicable' field and print statement
* Move excess/missing tool calls fields under additional details
* Typo fix and removal of redundant field in the prompt
* Modify per_tool_call_details field's name to details
* Revert "Modify per_tool_call_details field's name to details"
This reverts commit 2c3ce50.
* Revert "Merge branch 'main' into selshafey/improve_tool_call_accuracy"
* Black reformat
* Reformat with black
* To re-trigger build pipelines
* Add notebook for bugbash
* modify bugbash notebook
* Add support for built-in tools for Tool Call Accuracy Evaluator
* Remove bugbash notebook
* Resolve issues with merge
* Fix id value
* Use existing built-in tool definitions
* Run black
* Prompt modifications
* Add test cases for built-in tools
* Handle converter format
* Add test cases for converter format
* Support only converter format
* Revert tool definitions to be required, run black
---------
Co-authored-by: Salma Elshafey <[email protected]>
Copy file name to clipboard. Expand all lines: sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_converters/_models.py
+29 -1. Lines changed: 29 additions & 1 deletion
Original file line number
Diff line number
Diff line change
@@ -33,9 +33,12 @@
33
33
# Constants to only be used internally in this file for the built-in tools.
34
34
_CODE_INTERPRETER="code_interpreter"
35
35
_BING_GROUNDING="bing_grounding"
36
+
_BING_CUSTOM_SEARCH="bing_custom_search"
36
37
_FILE_SEARCH="file_search"
37
38
_AZURE_AI_SEARCH="azure_ai_search"
39
+
_SHAREPOINT_GROUNDING="sharepoint_grounding"
38
40
_FABRIC_DATAAGENT="fabric_dataagent"
41
+
_OPENAPI="openapi"
39
42
40
43
# Built-in tool descriptions and parameters are hidden, but we include basic descriptions
41
44
# for evaluation purposes.
@@ -44,9 +47,12 @@
44
47
+"generate code, and create graphs and charts using your data. Supports "
45
48
+"up to 20 files.",
46
49
_BING_GROUNDING: "Enhance model output with web data.",
47
-
_FILE_SEARCH: "Search for data across uploaded files.",
50
+
_BING_CUSTOM_SEARCH: "Enables agents to retrieve content from a curated subset of websites, enhancing relevance and reducing noise from public web searches.",
51
+
_FILE_SEARCH: "Search for data across uploaded files. A single call can return multiple results/files in the 'results' field.",
48
52
_AZURE_AI_SEARCH: "Search an Azure AI Search index for relevant data.",
53
+
_SHAREPOINT_GROUNDING: "Allows agents to access and retrieve relevant content from Microsoft SharePoint document libraries, grounding responses in organizational knowledge.",
49
54
_FABRIC_DATAAGENT: "Connect to Microsoft Fabric data agents to retrieve data across different data sources.",
55
+
_OPENAPI: "Connects agents to external RESTful APIs using OpenAPI 3.0 specifications, enabling seamless access to third-party services.",
50
56
}
51
57
52
58
# Built-in tool parameters are hidden, but we include basic parameters for evaluation purposes.
@@ -59,6 +65,15 @@
59
65
"type": "object",
60
66
"properties": {"requesturl": {"type": "string", "description": "URL used in Bing Search API."}},
61
67
},
68
+
_BING_CUSTOM_SEARCH: {
69
+
"type": "object",
70
+
"properties": {
71
+
"requesturl": {
72
+
"type": "string",
73
+
"description": "Search queries, along with pre-configured site restrictions or domain filters.",
74
+
}
75
+
},
76
+
},
62
77
_FILE_SEARCH: {
63
78
"type": "object",
64
79
"properties": {
@@ -76,10 +91,23 @@
76
91
"type": "object",
77
92
"properties": {"input": {"type": "string", "description": "Search terms to use."}},
78
93
},
94
+
_SHAREPOINT_GROUNDING: {
95
+
"type": "object",
96
+
"properties": {
97
+
"input": {"type": "string", "description": "A natural language query to search SharePoint content."}
98
+
},
99
+
},
79
100
_FABRIC_DATAAGENT: {
80
101
"type": "object",
81
102
"properties": {"input": {"type": "string", "description": "Search terms to use."}},
82
103
},
104
+
_OPENAPI: {
105
+
"type": "object",
106
+
"properties": {
107
+
"name": {"type": "string", "description": "The name of the function to call."},
108
+
"arguments": {"type": "string", "description": "JSON string of the arguments to pass to the function."},
Copy file name to clipboard. Expand all lines: sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluators/_tool_call_accuracy/_tool_call_accuracy.py
0 commit comments