import dspy
from dotenv import find_dotenv, load_dotenv
from dspy.datasets import HotPotQA
from dspy.teleprompt import BootstrapFewShot

from langtrace_python_sdk import inject_additional_attributes, langtrace

_ = load_dotenv(find_dotenv())

langtrace.init()

turbo = dspy.LM('openai/gpt-4o-mini')
colbertv2_wiki17_abstracts = dspy.ColBERTv2(url='http://20.102.90.50:2017/wiki17_abstracts')

dspy.settings.configure(lm=turbo, rm=colbertv2_wiki17_abstracts)
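
# With the LM and retriever registered in dspy.settings, the modules below pick
# them up implicitly. Optional retrieval sanity check (a sketch; assumes the
# public wiki17_abstracts endpoint above is reachable):
# topk = colbertv2_wiki17_abstracts("When was the first FIFA World Cup held?", k=3)
# print(topk[0]['long_text'])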


# Load the dataset.
dataset = HotPotQA(train_seed=1, train_size=20, eval_seed=2023, dev_size=50, test_size=0)

# Tell DSPy that the 'question' field is the input. Any other fields are labels and/or metadata.
trainset = [x.with_inputs('question') for x in dataset.train]
devset = [x.with_inputs('question') for x in dataset.dev]
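
# Each example keeps its gold labels alongside the declared input; for instance:
# print(trainset[0].question, '->', trainset[0].answer)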


class GenerateAnswer(dspy.Signature):
    """Answer questions with short factoid answers."""

    context = dspy.InputField(desc="may contain relevant facts")
    question = dspy.InputField()
    answer = dspy.OutputField(desc="often between 1 and 5 words")

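# The signature's docstring becomes the task instruction in the prompt, and each
# field's `desc` becomes an inline hint next to that field.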

class RAG(dspy.Module):
    def __init__(self, num_passages=3):
        super().__init__()

        self.retrieve = dspy.Retrieve(k=num_passages)
        self.generate_answer = dspy.ChainOfThought(GenerateAnswer)

    def forward(self, question):
        context = self.retrieve(question).passages
        prediction = self.generate_answer(context=context, question=question)
        return dspy.Prediction(context=context, answer=prediction.answer)
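
# The module runs even before compilation; a quick zero-shot sanity check
# (illustrative question, purely an example):
# print(RAG()(question="What castle did David Gregory inherit?").answer)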


# Validation logic: check that the predicted answer is correct.
# Also check that the retrieved context does actually contain that answer.
def validate_context_and_answer(example, prediction, trace=None):
    answer_em = dspy.evaluate.answer_exact_match(example, prediction)
    answer_pm = dspy.evaluate.answer_passage_match(example, prediction)
    return answer_em and answer_pm
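
# Note: during compilation, BootstrapFewShot calls this metric with a non-None
# `trace` and keeps a bootstrapped demonstration only when the metric passes.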


# Set up a basic optimizer, which will compile our RAG program.
optimizer = BootstrapFewShot(metric=validate_context_and_answer)

# Compile!
compiled_rag = optimizer.compile(RAG(), trainset=trainset)
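
# The compiled program now carries bootstrapped demonstrations; a sketch for
# inspecting them via the standard dspy.Module API:
# for name, predictor in compiled_rag.named_predictors():
#     print(name, len(predictor.demos))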

# Ask any question you like to this simple RAG program.
my_question = "Who was the hero of the movie Peraanmai?"

# Get the prediction. This contains `pred.context` and `pred.answer`.
# pred = compiled_rag(my_question)
pred = inject_additional_attributes(
    lambda: compiled_rag(my_question),
    {'experiment': 'experiment 6', 'description': 'trying additional stuff', 'run_id': 'run_1'},
)
# compiled_rag.save('compiled_rag_v1.json')
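# To reload the saved program later (standard pattern: instantiate, then load state):
# loaded_rag = RAG()
# loaded_rag.load('compiled_rag_v1.json')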

# Print the contexts and the answer.
print(f"Question: {my_question}")
print(f"Predicted Answer: {pred.answer}")
print(f"Retrieved Contexts (truncated): {[c[:200] + '...' for c in pred.context]}")

# print("Inspecting the history of the LM:")
# turbo.inspect_history(n=1)

from dspy.evaluate import Evaluate


# Placeholder metric that accepts every prediction; swap in a real check
# (e.g. exact match) to measure actual accuracy.
def validate_answer(example, pred, trace=None):
    return True


# Set up the evaluator, which can be used multiple times.
evaluate = Evaluate(
    devset=devset,
    metric=validate_answer,
    num_threads=4,
    display_progress=True,
    display_table=0,
)


# Evaluate our compiled RAG program.
evaluate(compiled_rag)
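
# A stricter metric than the always-True placeholder above, using DSPy's built-in
# exact-match check (a sketch; swap it into Evaluate to measure real accuracy):
# def validate_answer_em(example, pred, trace=None):
#     return dspy.evaluate.answer_exact_match(example, pred)
# evaluate_em = Evaluate(devset=devset, metric=validate_answer_em, num_threads=4, display_progress=True)
# print(evaluate_em(compiled_rag))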