demo-code

ysocarras-oracle · ysocarras-oracle · commit 18783655911a · 2025-04-22T16:41:40.000+02:00
diff --git a/ai/generative-ai-service/sentiment+categorization/README.md b/ai/generative-ai-service/sentiment+categorization/README.md
@@ -0,0 +1,2 @@
+> [!CAUTION]
+> Under construction.
diff --git a/ai/generative-ai-service/sentiment+categorization/demo_code/app.py b/ai/generative-ai-service/sentiment+categorization/demo_code/app.py
@@ -0,0 +1,16 @@
+import streamlit as st
+
+# Set the page title and icon; this is the first Streamlit call in the script.
+st.set_page_config(
+    page_title="Hello",
+    page_icon="👋",
+)
+
+# Landing-page heading (rendered from a Markdown "#" title).
+st.write("# Welcome to Streamlit! 👋")
+
+# Hint shown in the sidebar as a success message.
+st.sidebar.success("Select a demo above.")
+
+# Body text of the landing page, rendered as Markdown.
+st.markdown(
+    """
+This is a demo!
+"""
+)
diff --git a/ai/generative-ai-service/sentiment+categorization/demo_code/backend/data/complaints_messages.csv b/ai/generative-ai-service/sentiment+categorization/demo_code/backend/data/complaints_messages.csv
@@ -0,0 +1,31 @@
+ID,Message
+1,I had to cancel my order because of poor service.
+2,"The delivery was late, and the packaging was damaged."
+3,I was sent the wrong color of the product.
+4,My order was incomplete when it arrived.
+5,The product I received was damaged.
+6,The quality of the product is much worse than expected.
+7,The product stopped working after a short period of time.
+8,The product doesn’t match the description on the website.
+9,I’ve had to contact customer service multiple times for the same issue.
+10,Customer support was not helpful at all.
+11,The quality of the product was poor.
+12,The product was much smaller than I expected.
+13,I had trouble finding the product on your website.
+14,The instructions were unclear and hard to follow.
+15,The website was difficult to navigate during my purchase.
+16,I received the wrong size and need a replacement.
+17,I was given false information about the product.
+18,The product stopped working after a short period of time.
+19,The product arrived damaged and unusable.
+20,The product arrived in terrible condition.
+21,The product arrived damaged and unusable.
+22,The customer service was slow to respond.
+23,The product was missing some essential accessories.
+24,I didn’t receive any confirmation email for my order.
+25,The product wasn’t compatible with my other appliances.
+26,The product is faulty and doesn’t work properly.
+27,The product didn’t fit as expected.
+28,The product was extremely hard to set up.
+29,I am unhappy with the design of the product.
+30,The website was difficult to navigate during my purchase.
diff --git a/ai/generative-ai-service/sentiment+categorization/demo_code/backend/feedback_agent.py b/ai/generative-ai-service/sentiment+categorization/demo_code/backend/feedback_agent.py
@@ -0,0 +1,146 @@
+import json
+import logging
+from typing import List
+
+from langchain_community.chat_models.oci_generative_ai import ChatOCIGenAI
+from langchain_community.embeddings import OCIGenAIEmbeddings
+from langchain_core.messages import HumanMessage, SystemMessage
+from langchain_core.pydantic_v1 import BaseModel
+from langgraph.checkpoint.memory import MemorySaver
+from langgraph.graph import END, StateGraph
+
+import backend.message_handler as handler
+import backend.utils.llm_config as llm_config
+
+# Set up logging: let the "oci" logger emit records down to DEBUG level.
+logging.getLogger("oci").setLevel(logging.DEBUG)
+# CSV file holding the complaint messages. The path is relative, so it is
+# resolved against the working directory of the running process.
+messages_path = "ai/generative-ai-service/sentiment+categorization/demo_code/backend/data/complaints_messages.csv"
+
+
+class AgentState(BaseModel):
+    """State shared by the nodes of the feedback graph."""
+
+    # Parsed JSON replies of the summarization node.
+    messages_info: List = []
+    # Summaries with the category fields added by the categorization node.
+    categories: List = []
+    # Report text produced by the report-generation node.
+    reports: List = []
+
+
+class FeedbackAgent:
+    def __init__(self, model_name: str = "cohere_oci"):
+        self.model_name = model_name
+        self.model = self.initialize_model()
+        self.memory = MemorySaver()
+        self.builder = self.setup_graph()
+        self.messages = self.read_messages()
+
+    def initialize_model(self):
+        if self.model_name not in llm_config.MODEL_REGISTRY:
+            raise ValueError(f"Unknown model: {self.model_name}")
+
+        model_config = llm_config.MODEL_REGISTRY[self.model_name]
+
+        return ChatOCIGenAI(
+            model_id=model_config["model_id"],
+            service_endpoint=model_config["service_endpoint"],
+            compartment_id=model_config["compartment_id"],
+            provider=model_config["provider"],
+            auth_type=model_config["auth_type"],
+            auth_profile=model_config["auth_profile"],
+            model_kwargs=model_config["model_kwargs"],
+        )
+
+    def initialize_embeddings(self):
+        if self.model_name not in llm_config.MODEL_REGISTRY:
+            raise ValueError(f"Unknown model: {self.model_name}")
+
+        model_config = llm_config.MODEL_REGISTRY[self.model_name]
+
+        embeddings = OCIGenAIEmbeddings(
+            model_id=model_config["embedding_model"],
+            service_endpoint=model_config["service_endpoint"],
+            truncate="NONE",
+            compartment_id=model_config["compartment_id"],
+            auth_type=model_config["auth_type"],
+            auth_profile=model_config["auth_profile"],
+        )
+        return embeddings
+
+    def read_messages(self):
+        messages = handler.read_messages(filepath=messages_path)
+        return handler.batchify(messages, 30)
+
+    def summarization_node(self, state: AgentState):
+        batch = self.messages
+        response = self.model.invoke(
+            [
+                SystemMessage(
+                    content=llm_config.get_prompt(self.model_name, "SUMMARIZATION")
+                ),
+                HumanMessage(content=f"Message batch: {batch}"),
+            ]
+        )
+        state.messages_info = state.messages_info + [json.loads(response.content)]
+        return {"messages_info": state.messages_info}
+
+    def categorization_node(self, state: AgentState):
+        batch = state.messages_info
+        response = self.model.invoke(
+            [
+                SystemMessage(
+                    content=llm_config.get_prompt(
+                        self.model_name, "CATEGORIZATION_SYSTEM"
+                    )
+                ),
+                HumanMessage(
+                    content=llm_config.get_prompt(
+                        self.model_name, "CATEGORIZATION_USER"
+                    ).format(MESSAGE_BATCH=batch)
+                ),
+            ]
+        )
+        content = [json.loads(response.content)]
+        state.categories = state.categories + handler.match_categories(batch, content)
+        return {"categories": state.categories}
+
+    def generate_report_node(self, state: AgentState):
+        response = self.model.invoke(
+            [
+                SystemMessage(
+                    content=llm_config.get_prompt(self.model_name, "REPORT_GEN")
+                ),
+                HumanMessage(content=f"Message info: {state.categories}"),
+            ]
+        )
+        state.reports = response.content
+        return {"reports": [response.content]}
+
+    def setup_graph(self):
+        builder = StateGraph(AgentState)
+        builder.add_node("summarize", self.summarization_node)
+        builder.add_node("categorize", self.categorization_node)
+        builder.add_node("generate_report", self.generate_report_node)
+
+        builder.set_entry_point("summarize")
+        builder.add_edge("summarize", "categorize")
+        builder.add_edge("categorize", "generate_report")
+
+        builder.add_edge("generate_report", END)
+        return builder.compile(checkpointer=self.memory)
+
+    def get_graph(self):
+        return self.builder.get_graph()
+
+    def run(self):
+        thread = {"configurable": {"thread_id": "1"}}
+        for s in self.builder.stream(
+            config=thread,
+        ):
+            print(f"\n \n{s}")
+
+    def run_step_by_step(self):
+        thread = {"configurable": {"thread_id": "1"}}
+        initial_state = {
+            "messages_info": [],
+            "categories": [],
+            "reports": [],
+        }
+        for state in self.builder.stream(initial_state, thread):
+            yield state  # Yield each intermediate step to allow step-by-step execution
diff --git a/ai/generative-ai-service/sentiment+categorization/demo_code/backend/feedback_wrapper.py b/ai/generative-ai-service/sentiment+categorization/demo_code/backend/feedback_wrapper.py
@@ -0,0 +1,25 @@
+from backend.feedback_agent import FeedbackAgent
+
+
+class FeedbackAgentWrapper:
+    def __init__(self):
+        self.agent = FeedbackAgent()
+        self.run_graph = self.agent.run_step_by_step()
+
+    def get_nodes_edges(self):
+        graph_data = self.agent.get_graph()
+        nodes = list(graph_data.nodes.keys())
+        edges = [(edge.source, edge.target) for edge in graph_data.edges]
+        return nodes, edges
+
+    def run_step_by_step(self):
+        try:
+            action_output = next(self.run_graph)
+            current_node = list(action_output.keys())[0]
+        except StopIteration:
+            action_output = {}
+            current_node = "FINALIZED"
+        return current_node, action_output
+
+    def get_graph(self):
+        return self.agent.get_graph()
diff --git a/ai/generative-ai-service/sentiment+categorization/demo_code/backend/message_handler.py b/ai/generative-ai-service/sentiment+categorization/demo_code/backend/message_handler.py
@@ -0,0 +1,53 @@
+import csv
+from typing import List, Optional
+
+
+def read_messages(
+    filepath: str, columns: List[str] = ["ID", "Message"]
+) -> List[List[str]]:
+    with open(filepath, newline="", encoding="utf-8") as file:
+        reader = csv.DictReader(file)
+        extracted_data = []
+
+        for row in reader:
+            extracted_row = [row[col] for col in columns if col in row]
+            extracted_data.append(extracted_row)
+
+    return extracted_data
+
+
+def batchify(lst, batch_size):
+    return [lst[i : i + batch_size] for i in range(0, len(lst), batch_size)]
+
+
+def match_categories(summaries, categories):
+    result = []
+    for i, elem in enumerate(summaries[0]):
+        if elem["id"] == categories[0][i]["id"]:
+            elem["primary_category"] = categories[0][i]["primary_category"]
+            elem["secondary_category"] = categories[0][i]["secondary_category"]
+            elem["tertiary_category"] = categories[0][i]["tertiary_category"]
+            result.append(elem)
+    return result
+
+
+def group_by_category_level(categories_list):
+    result = {}
+
+    for category in categories_list:
+        primary = category["primary_category"]
+        secondary = category["secondary_category"]
+        tertiary = category["tertiary_category"]
+
+        if primary not in result:
+            result[primary] = {}
+
+        if secondary not in result[primary]:
+            result[primary][secondary] = {}
+
+        if tertiary not in result[primary][secondary]:
+            result[primary][secondary][tertiary] = []
+
+        result[primary][secondary][tertiary].append(category["id"])
+
+    return result
diff --git a/ai/generative-ai-service/sentiment+categorization/demo_code/backend/utils/config.py b/ai/generative-ai-service/sentiment+categorization/demo_code/backend/utils/config.py
@@ -0,0 +1,45 @@
+# config.py
+# Author: Ansh
+#
+# Static settings for the demo backend: vector-database selection, the OCI
+# Generative AI endpoint and authentication profile, and model identifiers.
+# NOTE(review): several values below are masked placeholders ("####",
+# "XXXX") that must be replaced before use. Avoid committing real
+# credentials to this file.
+
+DB_TYPE = "qdrant"  # Options: "oracle", "qdrant"
+
+# OracleDB Configuration
+ORACLE_DB_USER = "ansh"  # Oracle vector DB username
+ORACLE_DB_PWD = "Gena#######"  # Oracle vector DB password (masked placeholder)
+ORACLE_DB_HOST_IP = "######"  # Oracle vector DB host IP (masked placeholder)
+ORACLE_DB_PORT = 1521  # Oracle vector DB port
+ORACLE_DB_SERVICE = "orclpdb01.sub05101349370.bpivcnllm.oraclevcn.com"  # service part of the DSN below
+
+# Aliases of the credentials above, plus the DSN assembled as
+# "<host>:<port>/<service>".
+ORACLE_USERNAME = ORACLE_DB_USER
+ORACLE_PASSWORD = ORACLE_DB_PWD
+ORACLE_DSN = f"{ORACLE_DB_HOST_IP}:{ORACLE_DB_PORT}/{ORACLE_DB_SERVICE}"
+ORACLE_TABLE_NAME = (
+    "policyTable"  # Oracle DB table in which the embeddings are stored
+)
+
+# Qdrant Configuration
+QDRANT_LOCATION = ":memory:"
+QDRANT_COLLECTION_NAME = (
+    "my_documents"  # Qdrant collection in which the embeddings are stored
+)
+QDRANT_DISTANCE_FUNC = "Dot"
+
+# Common Configuration
+USER_ID = ""
+COMPARTMENT_ID = "ocid1.compartment.oc1..XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX"  # masked placeholder
+OBJECT_STORAGE_LINK = "https://objectstorage.eu-frankfurt-1.oraclecloud.com/n/##############/b/##########/o/"  # masked placeholder
+DIRECTORY = "data"  # directory holding the PDFs that the RAG model draws its documents from
+AUTH_TYPE = "API_KEY"
+CONFIG_PROFILE = "DEFAULT"
+PROMPT_CONTEXT = "You are an AI Assistant trained to give answers based only on the information provided. Given only the above text provided and not prior knowledge, answer the query. If someone asks you a question and you don't know the answer, don't try to make up a response, simply say: I don't know."
+ENDPOINT = "https://inference.generativeai.eu-frankfurt-1.oci.oraclecloud.com"  # change this to use a different region
+
+# COHERE data
+PROVIDER_COHERE = "cohere"
+EMBEDDING_MODEL_COHERE = "cohere.embed-english-v3.0"
+GENERATE_MODEL_COHERE = "cohere.command-r-plus-08-2024"  # alternatives: cohere.command-r-16k, cohere.command-r-plus, or the model OCID "ocid1.generativeaimodel.oc1.us-chicago-1.amaaaaaask7dceyanrlpnq5ybfu5hnzarg7jomak3q6kyhkzjsl4qj24fyoq"
+
+# LLAMA data
+PROVIDER_LLAMA = "meta"
+# Model OCID (eu-frankfurt-1) used as the "meta_oci" model id.
+GENERATE_MODEL_LLAMA_33= "ocid1.generativeaimodel.oc1.eu-frankfurt-1.amaaaaaask7dceya4tdabclcsqbc3yj2mozvvqoq5ccmliv3354hfu3mx6bq"
+
diff --git a/ai/generative-ai-service/sentiment+categorization/demo_code/backend/utils/llm_config.py b/ai/generative-ai-service/sentiment+categorization/demo_code/backend/utils/llm_config.py
@@ -0,0 +1,50 @@
+# import utils.config as config
+# from utils import prompts as prompts
+
+import backend.utils.config as config
+from backend.utils import prompts as prompts
+
+
+def get_prompt(model_name: str, prompt_type: str) -> str:
+    if model_name not in PROMPT_SETS:
+        raise ValueError(f"No prompts defined for model {model_name}")
+    if prompt_type not in PROMPT_SETS[model_name]:
+        raise ValueError(f"Unknown prompt type: {prompt_type}")
+    return PROMPT_SETS[model_name][prompt_type]
+
+
+# Connection and generation settings per supported model name. All values
+# come from backend.utils.config except the inline model_kwargs.
+# NOTE(review): only "cohere_oci" defines "embedding_model"; code that reads
+# that key for "meta_oci" gets a KeyError.
+MODEL_REGISTRY = {
+    "cohere_oci": {
+        "model_id": config.GENERATE_MODEL_COHERE,
+        "service_endpoint": config.ENDPOINT,
+        "compartment_id": config.COMPARTMENT_ID,
+        "provider": config.PROVIDER_COHERE,
+        "auth_type": config.AUTH_TYPE,
+        "auth_profile": config.CONFIG_PROFILE,
+        "model_kwargs": {"temperature": 0, "max_tokens": 4000},
+        "embedding_model": config.EMBEDDING_MODEL_COHERE,
+    },
+    "meta_oci": {
+        "model_id": config.GENERATE_MODEL_LLAMA_33,
+        "service_endpoint": config.ENDPOINT,
+        "compartment_id": config.COMPARTMENT_ID,
+        "provider": config.PROVIDER_LLAMA,
+        "auth_type": config.AUTH_TYPE,
+        "auth_profile": config.CONFIG_PROFILE,
+        "model_kwargs": {"temperature": 0, "max_tokens": 2000},
+    },
+}
+
+# Prompt text per model name, keyed by the prompt type passed to get_prompt().
+# NOTE(review): the "meta_oci" entries use "*_LLAMA" key names, while the
+# "cohere_oci" entries use the unsuffixed names. A lookup such as
+# get_prompt("meta_oci", "SUMMARIZATION") therefore raises ValueError --
+# confirm whether the Llama prompts should be registered under the same
+# prompt types as the Cohere ones.
+PROMPT_SETS = {
+    "cohere_oci": {
+        "SUMMARIZATION": prompts.SUMMARIZATION,
+        "CATEGORIZATION_SYSTEM": prompts.CATEGORIZATION_SYSTEM,
+        "CATEGORIZATION_USER": prompts.CATEGORIZATION_USER,
+        "REPORT_GEN": prompts.REPORT_GEN,
+    },
+    "meta_oci": {
+        "SUMMARIZATION_LLAMA": prompts.SUMMARIZATION_LLAMA,
+        "CATEGORIZATION_LLAMA": prompts.CATEGORIZATION_LLAMA,
+        "REPORT_GEN_LLAMA": prompts.REPORT_GEN_LLAMA,
+    },
+}
diff --git a/ai/generative-ai-service/sentiment+categorization/demo_code/backend/utils/prompts.py b/ai/generative-ai-service/sentiment+categorization/demo_code/backend/utils/prompts.py
diff --git a/ai/generative-ai-service/sentiment+categorization/demo_code/pages/SentimentByCat.py b/ai/generative-ai-service/sentiment+categorization/demo_code/pages/SentimentByCat.py

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+> [!CAUTION]`
	`2`	`+> Under construction.`