
Commit 5ed5c09

feat(cohere): auto trace cohere
1 parent 75b69c3 commit 5ed5c09

File tree

12 files changed: +2530 -1512 lines changed

cookbook/ab_testing.py

Lines changed: 24 additions & 19 deletions
```diff
@@ -1,15 +1,16 @@
+from typing import Tuple
+
 import os
 import random
-from typing import Tuple
 
 from openai import OpenAI
 
-from parea import trace, trace_insert, Parea, get_current_trace_id
+from parea import Parea, get_current_trace_id, trace, trace_insert
 from parea.schemas import FeedbackRequest
 
 client = OpenAI()
 # instantiate Parea client
-p = Parea(api_key=os.getenv('PAREA_API_KEY'))
+p = Parea(api_key=os.getenv("PAREA_API_KEY"))
 # wrap OpenAI client to trace calls
 p.wrap_openai_client(client)
 
@@ -19,28 +20,32 @@ def generate_email(user: str) -> Tuple[str, str]:
     """Randomly chooses a prompt to perform an A/B test for generating email. Returns the email and the trace ID.
     The latter is used to tie back the collected feedback from the user."""
     if random.random() < 0.5:
-        trace_insert({'metadata': {'ab_test_0': 'variant_0'}})
-        prompt = f'Generate a long email for {user}'
+        trace_insert({"metadata": {"ab_test_0": "variant_0"}})
+        prompt = f"Generate a long email for {user}"
     else:
-        trace_insert({'metadata': {'ab_test_0': 'variant_1'}})
-        prompt = f'Generate a short email for {user}'
-
-    email = client.chat.completions.create(
-        model="gpt-4o",
-        messages=[
-            {
-                "role": "user",
-                "content": prompt,
-            }
-        ],
-    ).choices[0].message.content
+        trace_insert({"metadata": {"ab_test_0": "variant_1"}})
+        prompt = f"Generate a short email for {user}"
+
+    email = (
+        client.chat.completions.create(
+            model="gpt-4o",
+            messages=[
+                {
+                    "role": "user",
+                    "content": prompt,
+                }
+            ],
+        )
+        .choices[0]
+        .message.content
+    )
 
     return email, get_current_trace_id()
 
 
 def main():
     # generate email and get trace ID
-    email, trace_id = generate_email('Max Mustermann')
+    email, trace_id = generate_email("Max Mustermann")
 
     # log user feedback on email using trace ID
     p.record_feedback(
@@ -51,5 +56,5 @@ def main():
     )
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     main()
```
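
The trace ID returned by `generate_email` is what ties later user feedback back to the A/B variant recorded in the trace metadata. The arguments to `record_feedback` are elided by the diff context above; as a purely hypothetical sketch of how a caller might close the loop (the field names are assumed from the `FeedbackRequest` import, not taken from this commit):

```python
# Hypothetical sketch, not the elided code above: map a user reaction to a
# 0-1 score and attach it to the traced A/B variant via its trace ID.
# Assumes FeedbackRequest accepts trace_id and score fields.
def on_user_reaction(trace_id: str, liked: bool) -> None:
    p.record_feedback(FeedbackRequest(trace_id=trace_id, score=1.0 if liked else 0.0))
```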

cookbook/cohere/trace_cohere.py

Lines changed: 44 additions & 0 deletions
New file:

```python
import os

import cohere
from dotenv import load_dotenv

from parea import Parea

load_dotenv()

p = Parea(api_key=os.getenv("PAREA_API_KEY"))
co = cohere.Client(api_key=os.getenv("COHERE_API_KEY"))
p.wrap_cohere_client(co)

response = co.chat(
    model="command-r-plus",
    preamble="You are a helpful assistant talking in JSON.",
    message="Generate a JSON describing a person, with the fields 'name' and 'age'",
    response_format={"type": "json_object"},
)
print(response)
print("\n\n")

response = co.chat(message="Who discovered gravity?")
print(response)
print("\n\n")

docs = [
    "Carson City is the capital city of the American state of Nevada.",
    "The Commonwealth of the Northern Mariana Islands is a group of islands in the Pacific Ocean. Its capital is Saipan.",
    "Capitalization or capitalisation in English grammar is the use of a capital letter at the start of a word. English usage varies from capitalization in other languages.",
    "Washington, D.C. (also known as simply Washington or D.C., and officially as the District of Columbia) is the capital of the United States. It is a federal district.",
    "Capital punishment (the death penalty) has existed in the United States since before the United States was a country. As of 2017, capital punishment is legal in 30 of the 50 states.",
]
response = co.rerank(
    model="rerank-english-v3.0",
    query="What is the capital of the United States?",
    documents=docs,
    top_n=3,
)
print(response)
print("\n\n")

for event in co.chat_stream(message="Who discovered gravity?"):
    print(event)
```
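
The wrapper's signature in `parea/client.py` below also accepts `cohere.AsyncClient`, so the same one-line wrapping should cover async usage. A minimal sketch under that assumption (not part of this commit):

```python
# Sketch only: assumes wrap_cohere_client traces cohere.AsyncClient the same
# way it traces the sync client, as its type hint below suggests.
import asyncio


async def traced_async_chat() -> None:
    aco = cohere.AsyncClient(api_key=os.getenv("COHERE_API_KEY"))
    p.wrap_cohere_client(aco)
    response = await aco.chat(model="command-r-plus", message="Who discovered gravity?")
    print(response.text)


asyncio.run(traced_async_chat())
```
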
Lines changed: 82 additions & 0 deletions
New file:

```python
from typing import List, Optional

import os
from datetime import datetime

import cohere
from dotenv import load_dotenv

from parea import Parea, trace, trace_insert

load_dotenv()

p = Parea(api_key=os.getenv("PAREA_API_KEY"))
co = cohere.Client(api_key=os.getenv("COHERE_API_KEY"))
p.wrap_cohere_client(co)


def call_llm(message: str, chat_history: Optional[List[dict]] = None, system_message: str = "", model: str = "command-r-plus") -> str:
    return co.chat(
        model=model,
        preamble=system_message,
        chat_history=chat_history or [],
        message=message,
    ).text


@trace
def argumentor(query: str, additional_description: str = "") -> str:
    return call_llm(
        system_message=f"""You are a debater making an argument on a topic. {additional_description}.
        The current time is {datetime.now().strftime("%Y-%m-%d")}""",
        message=f"The discussion topic is {query}",
    )


@trace
def critic(argument: str) -> str:
    return call_llm(
        system_message="""You are a critic.
        What unresolved questions or criticism do you have after reading the following argument?
        Provide a concise summary of your feedback.""",
        message=argument,
    )


@trace
def refiner(query: str, additional_description: str, argument: str, criticism: str) -> str:
    return call_llm(
        system_message=f"""You are a debater making an argument on a topic. {additional_description}.
        The current time is {datetime.now().strftime("%Y-%m-%d")}""",
        chat_history=[
            {"role": "USER", "message": f"The discussion topic is {query}"},
            {"role": "CHATBOT", "message": argument},
            {"role": "USER", "message": criticism},
        ],
        message="Please generate a new argument that incorporates the feedback from the user.",
    )


@trace
def argument_chain(query: str, additional_description: str = "") -> str:
    trace_insert({"session_id": "cus_1234", "end_user_identifier": "user_1234"})
    argument = argumentor(query, additional_description)
    criticism = critic(argument)
    refined_argument = refiner(query, additional_description, argument, criticism)
    return refined_argument


@trace(session_id="cus_1234", end_user_identifier="user_1234")
def json_call() -> str:
    completion = co.chat(
        model="command-r-plus",
        preamble="You are a helpful assistant talking in JSON.",
        message="What are you?",
        response_format={"type": "json_object"},
    )
    return completion.text


if __name__ == "__main__":
    result = argument_chain(
        "Whether sparkling wine is good for you.",
        additional_description="Provide a concise, few sentence argument on why sparkling wine is good for you.",
    )
    # print(result)
    # print(json_call())
```
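
This file demonstrates both ways the SDK attaches session metadata: `trace_insert` mutates the currently open trace at runtime (as in `argument_chain`), while decorator keywords like `@trace(session_id=...)` fix it at definition time (as in `json_call`). A small sketch of the runtime route, reusing `call_llm` from above (the function itself is illustrative, not part of the commit):

```python
@trace
def followup(question: str, user_id: str) -> str:
    # Tag the currently open trace at runtime instead of
    # hard-coding identifiers in the decorator.
    trace_insert({"end_user_identifier": user_id})
    return call_llm(message=question)
```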

cookbook/langchain/trace_class_call_method.py

Lines changed: 4 additions & 0 deletions
```diff
@@ -12,6 +12,10 @@
 
 p = Parea(api_key=os.getenv("PAREA_API_KEY"))
 
+from langsmith.evaluation import LangChainStringEvaluator
+
+qa_evaluator = [LangChainStringEvaluator("cot_qa")]
+
 
 class LangChainModule:
     handler = PareaAILangchainTracer()
```

parea/client.py

Lines changed: 7 additions & 0 deletions
```diff
@@ -118,6 +118,13 @@ def wrap_anthropic_client(self, client: "Anthropic", integration: Optional[str]
         if integration:
             self._add_integration(integration)
 
+    def wrap_cohere_client(self, client: Union["cohere.Client", "cohere.AsyncClient"], integration: Optional[str] = None) -> None:
+        from parea.wrapper.cohere.wrap_cohere import CohereClientWrapper
+
+        CohereClientWrapper().init(client=client)
+        if integration:
+            self._add_integration(integration)
+
     def _add_integration(self, integration: str) -> None:
         self._client.add_integration(integration)
 
```
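
The new method mirrors `wrap_anthropic_client`: delegate instrumentation to `CohereClientWrapper`, then optionally register an integration tag. Caller-side it looks roughly like this (a sketch; the integration label is made up for illustration):

```python
import os

import cohere

from parea import Parea

p = Parea(api_key=os.getenv("PAREA_API_KEY"))
co = cohere.Client(api_key=os.getenv("COHERE_API_KEY"))
p.wrap_cohere_client(co, integration="my-integration")  # hypothetical label
```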

parea/constants.py

Lines changed: 72 additions & 1 deletion
```diff
@@ -371,7 +371,78 @@ def str2bool(v):
         "completion": 15.00,
     },
 }
-ALL_NON_AZURE_MODELS_INFO = {**OPENAI_MODEL_INFO, **ANTHROPIC_MODEL_INFO}
+COHERE_MODEL_INFO: Dict[str, Dict[str, Union[float, int, Dict[str, int]]]] = {
+    "command-r-plus": {
+        "prompt": 3.0,
+        "completion": 15.0,
+        "token_limit": {"max_completion_tokens": 4096, "max_prompt_tokens": 128000},
+    },
+    "command-r": {
+        "prompt": 0.5,
+        "completion": 1.5,
+        "token_limit": {"max_completion_tokens": 4096, "max_prompt_tokens": 128000},
+    },
+    "command": {
+        "prompt": 1.0,
+        "completion": 2.0,
+        "token_limit": {"max_completion_tokens": 4096, "max_prompt_tokens": 4096},
+    },
+    "command-nightly": {
+        "prompt": 1.0,
+        "completion": 2.0,
+        "token_limit": {"max_completion_tokens": 128000, "max_prompt_tokens": 128000},
+    },
+    "command-light": {
+        "prompt": 0.3,
+        "completion": 0.6,
+        "token_limit": {"max_completion_tokens": 4096, "max_prompt_tokens": 4096},
+    },
+    "command-light-nightly": {
+        "prompt": 0.3,
+        "completion": 0.6,
+        "token_limit": {"max_completion_tokens": 4096, "max_prompt_tokens": 4096},
+    },
+    "c4ai-aya-23": {
+        "prompt": 0.0,
+        "completion": 0.0,
+        "token_limit": {"max_completion_tokens": 8192, "max_prompt_tokens": 8192},
+    },
+    "rerank-english-v3.0": {
+        "prompt": 0,
+        "completion": 0,
+        # $ per 1K
+        "search": 2.0,
+        "token_limit": {"max_completion_tokens": 4096, "max_prompt_tokens": 4096},
+    },
+    "rerank-multilingual-v3.0": {
+        "prompt": 0,
+        "completion": 0,
+        # $ per 1K
+        "search": 2.0,
+        "token_limit": {"max_completion_tokens": 4096, "max_prompt_tokens": 4096},
+    },
+    "rerank-english-v2.0": {
+        "prompt": 0,
+        "completion": 0,
+        # $ per 1K
+        "search": 1.0,
+        "token_limit": {"max_completion_tokens": 512, "max_prompt_tokens": 512},
+    },
+    "rerank-multilingual-v2.0": {
+        "prompt": 0,
+        "completion": 0,
+        # $ per 1K
+        "search": 1.0,
+        "token_limit": {"max_completion_tokens": 512, "max_prompt_tokens": 512},
+    },
+}
+COHERE_SEARCH_MODELS: set[str] = {
+    "rerank-english-v3.0",
+    "rerank-multilingual-v3.0",
+    "rerank-english-v2.0",
+    "rerank-multilingual-v2.0",
+}
+ALL_NON_AZURE_MODELS_INFO = {**OPENAI_MODEL_INFO, **ANTHROPIC_MODEL_INFO, **COHERE_MODEL_INFO}
 
 NOUNS = (
     "abac",
```

parea/experiment/experiment.py

Lines changed: 1 addition & 2 deletions
```diff
@@ -12,7 +12,6 @@
 
 from attrs import define, field
 from tqdm import tqdm
-from tqdm.asyncio import tqdm_asyncio
 
 from parea import Parea
 from parea.constants import PAREA_OS_ENV_EXPERIMENT_UUID
@@ -68,7 +67,7 @@ def apply_dataset_eval(dataset_level_evals: List[Callable]) -> List[EvaluationRe
         try:
             result = dataset_level_eval(root_traces)
         except Exception as e:
-            logger.exception(f"Error occurred calling dataset level eval function '{dataset_level_eval.__name__}': {e}", exc_info=e)
+            logger.error(f"Error occurred calling dataset level eval function '{dataset_level_eval.__name__}': {e}", exc_info=e)
             continue
         if result is None:
             continue
```

parea/utils/trace_utils.py

Lines changed: 4 additions & 4 deletions
```diff
@@ -245,7 +245,7 @@ def cleanup_trace(trace_id: str, start_time: datetime, context_token: contextvar
             output = access_output_of_func(output)
             output_for_eval_metrics = json_dumps(output)
         except Exception as e:
-            logger.exception(f"Error accessing output of func with output: {output}. Error: {e}", exc_info=e)
+            logger.error(f"Error accessing output of func with output: {output}. Error: {e}", exc_info=e)
     trace_data.get()[trace_id].output_for_eval_metrics = output_for_eval_metrics
 
     thread_eval_funcs_then_log(trace_id, eval_funcs)
@@ -263,7 +263,7 @@ async def async_wrapper(*args, **kwargs):
             fill_trace_data(trace_id, {"result": result, "output_as_list": output_as_list, "eval_funcs_names": eval_funcs_names}, UpdateTraceScenario.RESULT)
             return result
         except Exception as e:
-            logger.exception(f"Error occurred in function {func.__name__}, {e}")
+            logger.error(f"Error occurred in function {func.__name__}, {e}")
             fill_trace_data(trace_id, {"error": traceback.format_exc()}, UpdateTraceScenario.ERROR)
             raise e
         finally:
@@ -283,7 +283,7 @@ def wrapper(*args, **kwargs):
             fill_trace_data(trace_id, {"result": result, "output_as_list": output_as_list, "eval_funcs_names": eval_funcs_names}, UpdateTraceScenario.RESULT)
             return result
         except Exception as e:
-            logger.exception(f"Error occurred in function {func.__name__}, {e}")
+            logger.error(f"Error occurred in function {func.__name__}, {e}")
             fill_trace_data(trace_id, {"error": traceback.format_exc()}, UpdateTraceScenario.ERROR)
             raise e
         finally:
@@ -326,7 +326,7 @@ def call_eval_funcs_then_log(trace_id: str, eval_funcs: List[Callable] = None):
             elif score is not None:
                 scores.append(EvaluationResult(name=func.__name__, score=score))
         except Exception as e:
-            logger.exception(f"Error occurred calling evaluation function '{func.__name__}', {e}", exc_info=e)
+            logger.error(f"Error occurred calling evaluation function '{func.__name__}', {e}", exc_info=e)
     trace_data.get()[trace_id].scores = scores
     thread_ids_running_evals.get().remove(trace_id)
```
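
These hunks, like the one in parea/experiment/experiment.py above, swap `logger.exception` for `logger.error`. Both log at ERROR level; `exception()` merely implies `exc_info=True`, so where `exc_info=e` is still passed explicitly the traceback is preserved, and `error()` is also safe to call outside an `except` block. For illustration:

```python
import logging

logging.basicConfig()
logger = logging.getLogger(__name__)

try:
    1 / 0
except ZeroDivisionError as e:
    # Both emit an ERROR record carrying the same traceback.
    logger.exception("boom: %s", e)
    logger.error("boom: %s", e, exc_info=e)
```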
