Skip to content

Commit 9f31b50

Browse files
author
louyk18
committed
write by sec
1 parent eef8484 commit 9f31b50

File tree

6 files changed

+416
-81
lines changed

6 files changed

+416
-81
lines changed

python/graphy/apps/demo_app.py

Lines changed: 107 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,7 @@
1212
from db import JsonFileStore
1313
from graph.nodes.chain_node import BaseChainNode
1414
from apps.text_generator import ReportGenerator
15+
from apps.graph_analyzer import LLMGraphAnalyzer
1516
from models import set_llm_model, DefaultEmbedding, DEFAULT_LLM_MODEL_CONFIG
1617

1718
from threading import Thread
@@ -128,6 +129,7 @@ def __init__(
128129
self.llm_report()
129130

130131
self.text_generator = ReportGenerator(self.llm.model)
132+
self.graph_analyzer = LLMGraphAnalyzer(self.llm.model)
131133

132134
def get_persist_store(self, dataset_id):
133135
persist_store = self.persist_stores.setdefault(
@@ -1228,6 +1230,111 @@ def do_summarizing():
12281230
traceback.print_exc()
12291231
return create_error_response(str(e)), 500
12301232

1233+
@self.app.route("/api/llm/analyze/fetch", methods=["POST"])
def fetch_query():
    """Build a fetch-query prompt from a user query and a graph schema.

    Expects a JSON body with required keys "query" and "schema", plus an
    optional "lang" naming the target query language (default "cypher").

    Returns:
        (JSON {"prompts": ...}, 200) on success,
        (error JSON, 400) for a missing/invalid body or missing field,
        (error JSON, 500) on unexpected failures.
    """
    try:
        # silent=True makes a missing or malformed JSON body yield None
        # instead of raising, so it can be reported as a client error
        # (400) rather than surfacing as a 500 below.
        input_data = request.get_json(silent=True)
        if input_data is None:
            return create_error_response("Request body must be JSON"), 400

        required_fields = [
            "query",
            "schema",
        ]
        for field in required_fields:
            if field not in input_data:
                return (
                    create_error_response(f"Missing {field} in request"),
                    400,
                )

        query = input_data["query"]
        schema = input_data["schema"]
        lang = input_data.get("lang", "cypher")

        output_prompt = self.graph_analyzer.get_fetch_query(
            query=query, schema=schema, lang=lang
        )

        # Return success response
        return (
            create_json_response({"prompts": output_prompt}),
            200,
        )

    except Exception as e:
        traceback.print_exc()
        return create_error_response(str(e)), 500
1266+
1267+
@self.app.route("/api/llm/analyze/mindmap", methods=["POST"])
def get_mind_map():
    """Produce a mind map for a query over the supplied data.

    Expects a JSON body with required keys "query" and "data".

    Returns:
        (JSON {"mind_map": ...}, 200) on success,
        (error JSON, 400) for a missing/invalid body or missing field,
        (error JSON, 500) on unexpected failures.
    """
    try:
        # silent=True: a missing/malformed JSON body becomes None here,
        # which is reported as a 400 instead of raising into the
        # generic 500 handler below.
        input_data = request.get_json(silent=True)
        if input_data is None:
            return create_error_response("Request body must be JSON"), 400

        required_fields = [
            "query",
            "data",
        ]
        for field in required_fields:
            if field not in input_data:
                return (
                    create_error_response(f"Missing {field} in request"),
                    400,
                )

        query = input_data["query"]
        data = input_data["data"]

        output_json = self.graph_analyzer.get_mind_map(query=query, data=data)

        # Return success response
        return (
            create_json_response({"mind_map": output_json}),
            200,
        )

    except Exception as e:
        traceback.print_exc()
        return create_error_response(str(e)), 500
1297+
1298+
@self.app.route("/api/llm/analyze/writereport", methods=["POST"])
def get_report():
    """Write a section-by-section report from a query and its mind map.

    Expects a JSON body with required keys "query" and "mind_map", plus
    optional "max_token_per_subsection" (default 100) and "bib2id"
    (default empty mapping) forwarded to the analyzer.

    Returns:
        (JSON {"text": ...}, 200) on success,
        (error JSON, 400) for a missing/invalid body or missing field,
        (error JSON, 500) on unexpected failures.
    """
    try:
        # silent=True: treat an absent/unparseable JSON body as a client
        # error (400) rather than letting the membership test below
        # raise and turn into a 500.
        input_data = request.get_json(silent=True)
        if input_data is None:
            return create_error_response("Request body must be JSON"), 400

        required_fields = [
            "query",
            "mind_map",
        ]
        for field in required_fields:
            if field not in input_data:
                return (
                    create_error_response(f"Missing {field} in request"),
                    400,
                )

        query = input_data["query"]
        mind_map = input_data["mind_map"]
        max_token_per_subsection = input_data.get(
            "max_token_per_subsection", 100
        )
        bib2id = input_data.get("bib2id", {})

        output_text = self.graph_analyzer.write_report_sec_by_sec(
            query=query,
            mind_map=mind_map,
            max_token_per_subsection=max_token_per_subsection,
            bib2id=bib2id,
        )

        # Return success response
        return (
            create_json_response({"text": output_text}),
            200,
        )

    except Exception as e:
        traceback.print_exc()
        return create_error_response(str(e)), 500
1337+
12311338
@self.app.route("/api/llm/report/prepare", methods=["POST"])
12321339
def prepare_report():
12331340
try:

python/graphy/apps/graph_analyzer.py

Lines changed: 77 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,11 @@
1717
TEMPLATE_QUERY_GENERATOR,
1818
TEMPLATE_MIND_MAP_GENERATOR,
1919
TEMPLATE_RELATED_WORK_GENERATOR,
20+
TEMPLATE_RELATED_WORK_INTRO_GENERATOR,
21+
TEMPLATE_RELATED_WORK_TEXT_PROMPT,
22+
TEMPLATE_TEXT_EXAMPLE_PROMPT,
23+
TEMPLATE_SUBSECTION_INSTRUCTION_PROMPT,
24+
TEMPLATE_PREVIOUS_SUBSECITON_PROMPT,
2025
)
2126

2227
logger = logging.getLogger()
@@ -93,6 +98,78 @@ def write_report(self, query, mind_map, max_token_per_subsection):
9398

9499
return result
95100

101+
def generate_section_texts(self, query, mind_map, max_token_per_subsection):
    """Build one LLM prompt per category in the mind map.

    Args:
        query: The user's original query string, embedded in each prompt.
        mind_map: Mapping whose "data" entry is a list of category dicts.
        max_token_per_subsection: Token budget hint embedded in each prompt.

    Returns:
        A list of formatted prompt strings, one per category, in order.
    """
    section_prompts = []

    # Subsection numbering in the prompt templates is 1-based.
    for subsection_id, category in enumerate(mind_map.get("data", []), start=1):
        prop_slot = str(category)

        generated_instruction = ""
        # Only the first subsection carries the worked example.
        if subsection_id == 1:
            generated_instruction += TEMPLATE_TEXT_EXAMPLE_PROMPT

        generated_instruction += TEMPLATE_SUBSECTION_INSTRUCTION_PROMPT.format(
            subsection_id=str(subsection_id),
            max_token_per_subsection=str(max_token_per_subsection),
        )

        # Later subsections get a <PREVIOUS></PREVIOUS> placeholder that
        # is filled with earlier output when the report is assembled
        # (see write_report_sec_by_sec).
        if subsection_id > 1:
            generated_instruction += TEMPLATE_PREVIOUS_SUBSECITON_PROMPT

        section_prompts.append(
            TEMPLATE_RELATED_WORK_TEXT_PROMPT.format(
                user_query=query,
                prop_slot=prop_slot,
                generate_instruction=generated_instruction,
            )
        )

    return section_prompts
130+
131+
def write_report_sec_by_sec(
    self, query, mind_map, max_token_per_subsection, bib2id=None
):
    """Generate a report: intro first, then one subsection at a time.

    Each subsection prompt may contain a <PREVIOUS></PREVIOUS>
    placeholder, which is replaced with all text generated so far so the
    model keeps continuity between subsections.

    Args:
        query: The user's original query string.
        mind_map: Mapping whose "data" entry lists category dicts with
            "name" and "description" keys.
        max_token_per_subsection: Token budget hint per subsection.
        bib2id: Optional bibliography mapping appended at the end;
            defaults to an empty mapping.

    Returns:
        The full report text (intro + sections + bibliography).
    """
    # Avoid a mutable default argument: materialize the empty mapping
    # per call instead of sharing one dict across invocations.
    if bib2id is None:
        bib2id = {}

    # Comma-joined JSON fragments describing each category feed the
    # intro-generation template.
    prop_slot = ",".join(
        json.dumps(
            {
                "name": category.get("name", ""),
                "description": category.get("description", ""),
            }
        )
        for category in mind_map.get("data", [])
    )

    intro_prompt = TEMPLATE_RELATED_WORK_INTRO_GENERATOR.format(prop_slot=prop_slot)
    intro_text = self.generate("get_report_intro", intro_prompt)

    section_prompts = self.generate_section_texts(
        query=query,
        mind_map=mind_map,
        max_token_per_subsection=max_token_per_subsection,
    )

    section_text = ""
    for text_prompt in section_prompts:
        # Inject everything generated so far so later subsections can
        # build on (and avoid repeating) earlier ones.
        if "<PREVIOUS></PREVIOUS>" in text_prompt:
            text_prompt = text_prompt.replace("<PREVIOUS></PREVIOUS>", section_text)
        new_section_text = self.generate("query_report_text", text_prompt)
        section_text += "\n" + new_section_text + "\n"

    final_section = intro_text + "\n" + section_text
    # NOTE(review): append_bib_text declares its parameter as id2bib but a
    # bib2id mapping is passed here — confirm the expected key direction.
    bib_text = self.append_bib_text(final_section, bib2id)

    final_section += bib_text

    return final_section
172+
96173
def append_bib_text(self, text, id2bib):
97174
bib_text = ""
98175
cited_papers = set()

0 commit comments

Comments
 (0)