A way to output simulated qa in a format compatible with eval (#34479)

nagkumar91 · web-flow · commit a7868e9fccfe · 2024-02-28T14:46:10.000-08:00
* Changed the parameter from max_count to limit

* Add a method to have output in qa format from simulator

* simulation_result_limit was missing from main
diff --git a/sdk/ai/azure-ai-generative/azure/ai/generative/synthetic/simulator/simulator/_utils.py b/sdk/ai/azure-ai-generative/azure/ai/generative/synthetic/simulator/simulator/_utils.py
@@ -10,3 +10,19 @@ def to_json_lines(self):
         for item in self:
             json_lines += json.dumps(item) + "\n"
         return json_lines
+    
+    def to_eval_qa_json_lines(self):
+        """Return a str holding one ``{"question": ..., "answer": ...}`` JSON line per item.
+
+        Uses the last 'user' and last 'assistant' message of each item; items lacking either (or empty) are skipped.
+        """
+        qa_lines = []
+        for item in self:
+            # Later messages overwrite earlier ones, so only the final message of each role survives.
+            latest = {m['role']: m['content'] for m in item['messages'] if m['role'] in ('user', 'assistant')}
+            question, answer = latest.get('user'), latest.get('assistant')
+            if question and answer:
+                qa_lines.append(json.dumps({'question': question, 'answer': answer}) + "\n")
+        return "".join(qa_lines)
+
+        
diff --git a/sdk/ai/azure-ai-generative/azure/ai/generative/synthetic/simulator/simulator/simulator.py b/sdk/ai/azure-ai-generative/azure/ai/generative/synthetic/simulator/simulator/simulator.py
@@ -219,7 +219,8 @@ async def simulate_async(
         api_call_retry_limit: int = 3,
         api_call_retry_sleep_sec: int = 1,
         api_call_delay_sec: float = 0,
-        concurrent_async_task: int = 3
+        concurrent_async_task: int = 3,
+        simulation_result_limit: int = 3,
     ):
         """Asynchronously simulate conversations using the provided template and parameters
 
@@ -241,6 +242,8 @@ async def simulate_async(
         :paramtype api_call_delay_sec: float, optional
         :keyword concurrent_async_task: The maximum number of asynchronous tasks to run concurrently. Defaults to 3.
         :paramtype concurrent_async_task: int, optional
+        :keyword simulation_result_limit: The maximum number of simulation results to return. Defaults to 3.
+        :paramtype simulation_result_limit: int, optional
 
         :return: A list of dictionaries containing the simulation results.
         :rtype: List[Dict]
@@ -271,7 +274,6 @@ async def simulate_async(
         semaphore = asyncio.Semaphore(concurrent_async_task)
         sim_results = []
         tasks = []
-
         for t in templates:
             for p in t.template_parameters:
                 if jailbreak:
@@ -294,6 +296,12 @@ async def simulate_async(
                     )
                 )
 
+                if len(tasks) >= simulation_result_limit:
+                    break
+
+            if len(tasks) >= simulation_result_limit:
+                break
+
         sim_results = await asyncio.gather(*tasks)
 
         return JsonLineList(sim_results)
@@ -324,6 +332,8 @@ async def _simulate_async(
             api_call_delay_sec (float, optional): The time in seconds to wait between API calls. Defaults to 0.
             concurrent_async_task (int, optional): The maximum number of asynchronous tasks to run concurrently.
                 Defaults to 3.
+            simulation_result_limit (int, optional): The maximum number of simulation results to return. Defaults to 3.
+
         Returns:
             List[Dict]: A list of dictionaries containing the simulation results.