zenml-io
diff --git a/llm-complete-guide/README.md b/llm-complete-guide/README.md
Lines changed: 2 additions & 8 deletions
diff --git a/llm-complete-guide/configs/dev/rag.yaml b/llm-complete-guide/configs/dev/rag.yaml
Lines changed: 0 additions & 1 deletion
diff --git a/llm-complete-guide/constants.py b/llm-complete-guide/constants.py
Lines changed: 5 additions & 3 deletions
diff --git a/llm-complete-guide/deployment_hf.py b/llm-complete-guide/deployment_hf.py
Lines changed: 37 additions & 6 deletions
diff --git a/llm-complete-guide/gh_action_rag.py b/llm-complete-guide/gh_action_rag.py
Lines changed: 6 additions & 8 deletions
diff --git a/llm-complete-guide/pipelines/__init__.py b/llm-complete-guide/pipelines/__init__.py
Lines changed: 1 addition & 1 deletion
diff --git a/llm-complete-guide/pipelines/finetune_embeddings.py b/llm-complete-guide/pipelines/finetune_embeddings.py
Lines changed: 0 additions & 1 deletion
diff --git a/llm-complete-guide/pipelines/llm_basic_rag.py b/llm-complete-guide/pipelines/llm_basic_rag.py
Lines changed: 0 additions & 1 deletion
diff --git a/llm-complete-guide/pipelines/llm_index_and_evaluate.py b/llm-complete-guide/pipelines/llm_index_and_evaluate.py
Lines changed: 2 additions & 1 deletion
diff --git a/llm-complete-guide/requirements.txt b/llm-complete-guide/requirements.txt
Lines changed: 2 additions & 1 deletion
@@ -100,7 +100,7 @@ use for the LLM.
 When you're ready to make the query, run the following command:
 
 ```shell
-python run.py query "how do I use a custom materializer inside my own zenml steps? i.e. how do I set it? inside the @step decorator?" --model=gpt4
+python run.py query --query-text "how do I use a custom materializer inside my own zenml steps? i.e. how do I set it? inside the @step decorator?" --model=gpt4
 ```
 
 Alternative options for LLMs to use include:
@@ -147,13 +147,7 @@ export ZENML_HF_SPACE_NAME=<YOUR_HF_SPACE_NAME> # optional, defaults to "llm-com
 To deploy the RAG pipeline, you can use the following command:
 
 ```shell
-python run.py --deploy
-```
-
-Alternatively, you can run the basic RAG pipeline *and* deploy it in one go:
-
-```shell
-python run.py --rag --deploy
+python run.py deploy
 ```
 
 This will open a Hugging Face space in your browser where you can interact with
 
@@ -1,6 +1,5 @@
 enable_cache: False
 
-# environment configuration
 settings:
   docker:
     requirements:
 
@@ -17,14 +17,16 @@
 import os
 
 # Vector Store constants
-CHUNK_SIZE = 2000
+CHUNK_SIZE = 1000
 CHUNK_OVERLAP = 50
 EMBEDDING_DIMENSIONALITY = (
     384  # Update this to match the dimensionality of the new model
 )
 
 # ZenML constants
 ZENML_CHATBOT_MODEL = "zenml-docs-qa-chatbot"
+ZENML_CHATBOT_MODEL_NAME = "zenml-docs-qa-chatbot"
+ZENML_CHATBOT_MODEL_VERSION = "0.71.0-dev"
 
 # Scraping constants
 RATE_LIMIT = 5  # Maximum number of requests per second
@@ -35,8 +37,8 @@
 MODEL_NAME_MAP = {
     "gpt4": "gpt-4",
     "gpt35": "gpt-3.5-turbo",
-    "claude3": "claude-3-opus-20240229",
-    "claudehaiku": "claude-3-haiku-20240307",
+    "claude3": "claude-3-5-sonnet-latest",
+    "claudehaiku": "claude-3-5-haiku-latest",
 }
 
 # CHUNKING_METHOD = "split-by-document"
 
@@ -1,13 +1,44 @@
+import logging
+
 import gradio as gr
+from constants import SECRET_NAME
 from utils.llm_utils import process_input_with_retrieval
+from zenml.client import Client
 
+# Set up logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
 
-def predict(message, history):
-    return process_input_with_retrieval(
-        input=message,
-        n_items_retrieved=20,
-        use_reranking=True,
+# Initialize ZenML client and verify secret access
+try:
+    client = Client()
+    secret = client.get_secret(SECRET_NAME)
+    logger.info(
+        f"Successfully initialized ZenML client and found secret {SECRET_NAME}"
     )
+except Exception as e:
+    logger.error(f"Failed to initialize ZenML client or access secret: {e}")
+    raise RuntimeError(f"Application startup failed: {e}")
+
+
+def predict(message, history):
+    try:
+        return process_input_with_retrieval(
+            input=message,
+            n_items_retrieved=20,
+            use_reranking=True,
+        )
+    except Exception as e:
+        logger.error(f"Error processing message: {e}")
+        return f"Sorry, I encountered an error: {str(e)}"
+
 
+# Launch the Gradio interface
+interface = gr.ChatInterface(
+    predict,
+    title="ZenML Documentation Assistant",
+    description="Ask me anything about ZenML!",
+)
 
-gr.ChatInterface(predict, type="messages").launch()
+if __name__ == "__main__":
+    interface.launch(server_name="0.0.0.0", share=False)
@@ -21,12 +21,10 @@
 
 import click
 import yaml
-from zenml.enums import PluginSubType
-
 from pipelines.llm_index_and_evaluate import llm_index_and_evaluate
-from zenml.client import Client
 from zenml import Model
-from zenml.exceptions import ZenKeyError
+from zenml.client import Client
+from zenml.enums import PluginSubType
 
 
 @click.command(
@@ -89,7 +87,7 @@ def main(
     zenml_model_name: Optional[str] = "zenml-docs-qa-rag",
     zenml_model_version: Optional[str] = None,
 ):
-    """ 
+    """
     Executes the pipeline to train a basic RAG model.
 
     Args:
@@ -108,14 +106,14 @@ def main(
         config = yaml.safe_load(file)
 
     # Read the model version from a file in the root of the repo
-    #  called "ZENML_VERSION.txt". 
+    #  called "ZENML_VERSION.txt".
     if zenml_model_version == "staging":
         postfix = "-rc0"
     elif zenml_model_version == "production":
         postfix = ""
     else:
         postfix = "-dev"
-  
+
     if Path("ZENML_VERSION.txt").exists():
         with open("ZENML_VERSION.txt", "r") as file:
             zenml_model_version = file.read().strip()
@@ -177,7 +175,7 @@ def main(
                 service_account_id=service_account_id,
                 auth_window=0,
                 flavor="builtin",
-                action_type=PluginSubType.PIPELINE_RUN
+                action_type=PluginSubType.PIPELINE_RUN,
             ).id
             client.create_trigger(
                 name="Production Trigger LLM-Complete",
 
@@ -19,5 +19,5 @@
 from pipelines.generate_chunk_questions import generate_chunk_questions
 from pipelines.llm_basic_rag import llm_basic_rag
 from pipelines.llm_eval import llm_eval
+from pipelines.llm_index_and_evaluate import llm_index_and_evaluate
 from pipelines.rag_deployment import rag_deployment
-from pipelines.llm_index_and_evaluate import llm_index_and_evaluate
@@ -12,7 +12,6 @@
 #  or implied. See the License for the specific language governing
 #  permissions and limitations under the License.
 
-from constants import EMBEDDINGS_MODEL_NAME_ZENML
 from steps.finetune_embeddings import (
     evaluate_base_model,
     evaluate_finetuned_model,
 
@@ -14,7 +14,6 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
-from litellm import config_path
 
 from steps.populate_index import (
     generate_embeddings,
 
@@ -15,9 +15,10 @@
 # limitations under the License.
 #
 
-from pipelines import llm_basic_rag, llm_eval
 from zenml import pipeline
 
+from pipelines import llm_basic_rag, llm_eval
+
 
 @pipeline
 def llm_index_and_evaluate() -> None:
 
@@ -1,4 +1,4 @@
-zenml[server]
+zenml[server]>=0.73.0
 ratelimit
 pgvector
 psycopg2-binary
@@ -21,6 +21,7 @@ torch
 gradio
 huggingface-hub
 elasticsearch
+tenacity
 
 # optional requirements for S3 artifact store
 # s3fs>2022.3.0
Original file line number	Diff line number	Diff line change
`@@ -14,7 +14,6 @@`
`14`	`14`	`# See the License for the specific language governing permissions and`
`15`	`15`	`# limitations under the License.`
`16`	`16`	`#`
`17`		`-from litellm import config_path`
`18`	`17`
`19`	`18`	`from steps.populate_index import (`
`20`	`19`	`generate_embeddings,`
Original file line number	Diff line number	Diff line change
`@@ -15,9 +15,10 @@`
`15`	`15`	`# limitations under the License.`
`16`	`16`	`#`
`17`	`17`
`18`		`-from pipelines import llm_basic_rag, llm_eval`
`19`	`18`	`from zenml import pipeline`
`20`	`19`
	`20`	`+from pipelines import llm_basic_rag, llm_eval`
	`21`	`+`
`21`	`22`
`22`	`23`	`@pipeline`
`23`	`24`	`def llm_index_and_evaluate() -> None:`