Skip to content

Commit 395f9f7

Browse files
committed
agent eval updates
1 parent 7871f53 commit 395f9f7

File tree

1 file changed

+20
-21
lines changed

1 file changed

+20
-21
lines changed

articles/ai-foundry/concepts/evaluation-evaluators/rag-evaluators.md

Lines changed: 20 additions & 21 deletions
Original file line number | Diff line number | Diff line change
@@ -96,60 +96,59 @@ from azure.ai.evaluation import DocumentRetrievalEvaluator
9696
retrieval_ground_truth = [
9797
{
9898
"document_id": "1",
99-
"query_relevance_judgement": 4
99+
"query_relevance_label": 4
100100
},
101101
{
102102
"document_id": "2",
103-
"query_relevance_judgement": 2
103+
"query_relevance_label": 2
104104
},
105105
{
106106
"document_id": "3",
107-
"query_relevance_judgement": 3
107+
"query_relevance_label": 3
108108
},
109109
{
110110
"document_id": "4",
111-
"query_relevance_judgement": 1
111+
"query_relevance_label": 1
112112
},
113113
{
114114
"document_id": "5",
115-
"query_relevance_judgement": 0
115+
"query_relevance_label": 0
116116
},
117117
]
118118

119+
# these are the relevance scores the retrieval system assigned to each retrieved document
119120
retrieved_documents = [
120121
{
121122
"document_id": "2",
122-
"query_relevance_judgement": 45.1
123+
"relevance_score": 45.1
123124
},
124125
{
125126
"document_id": "6",
126-
"query_relevance_judgement": 35.8
127+
"relevance_score": 35.8
127128
},
128129
{
129130
"document_id": "3",
130-
"query_relevance_judgement": 29.2
131+
"relevance_score": 29.2
131132
},
132133
{
133134
"document_id": "5",
134-
"query_relevance_judgement": 25.4
135+
"relevance_score": 25.4
135136
},
136137
{
137138
"document_id": "7",
138-
"query_relevance_judgement": 18.8
139+
"relevance_score": 18.8
139140
},
140141
]
141142

142-
default_threshold = {
143-
"ndcg@3": 0.5,
144-
"xdcg@3": 0.5,
145-
"fidelity": 0.5,
146-
"top1_relevance": 50,
147-
"top3_max_relevance": 50,
148-
"total_retrieved_documents": 50,
149-
"total_ground_truth_documents": 50,
150-
}
151-
152-
document_retrieval_evaluator = DocumentRetrievalEvaluator(threshold=default_threshold)
143+
document_retrieval_evaluator = DocumentRetrievalEvaluator(
144+
ndcg_threshold = 0.5,
145+
xdcg_threshold = 50.0,
146+
fidelity_threshold = 0.5,
147+
top1_relevance_threshold = 50.0,
148+
top3_max_relevance_threshold = 50.0,
149+
total_retrieved_documents_threshold = 50,
150+
total_ground_truth_documents_threshold = 50
151+
)
153152
document_retrieval_evaluator(retrieval_ground_truth=retrieval_ground_truth, retrieved_documents=retrieved_documents)
154153
```
155154

0 commit comments

Comments
 (0)