
Commit e471d91

Merge pull request #111 from cohere-ai/misc-updates
Update Chat & RAG Part 3
2 parents 66a3772 + 98f0be1 commit e471d91

File tree

1 file changed: +72 -61 lines changed

notebooks/RAG_Chatbot_with_Chat_Embed_Rerank.ipynb

Lines changed: 72 additions & 61 deletions
@@ -74,15 +74,16 @@
 "outputs": [],
 "source": [
 "import cohere\n",
-"import os\n",
 "import hnswlib\n",
 "import json\n",
 "import uuid\n",
 "from typing import List, Dict\n",
 "from unstructured.partition.html import partition_html\n",
 "from unstructured.chunking.title import chunk_by_title\n",
 "\n",
-"co = cohere.Client(os.environ[\"COHERE_API_KEY\"])"
+"# co = cohere.Client(\"COHERE_API_KEY\")\n",
+"import os\n",
+"co = cohere.Client(os.getenv(\"COHERE_API_KEY\"))"
 ]
 },
 {
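Note on the hunk above: the client is now built from an environment variable via os.getenv rather than os.environ, with the import of os moved next to the client construction and a commented-out placeholder left for pasting a key directly. Rendered as plain Python, the updated cell reads roughly as follows (a sketch from the diff, assuming COHERE_API_KEY is exported in the environment):

import cohere
import hnswlib
import json
import uuid
from typing import List, Dict
from unstructured.partition.html import partition_html
from unstructured.chunking.title import chunk_by_title

# co = cohere.Client("COHERE_API_KEY")  # placeholder for a hard-coded key, kept commented out
import os
co = cohere.Client(os.getenv("COHERE_API_KEY"))  # read the key from the environment

One practical difference: os.getenv returns None when the variable is unset, whereas os.environ["COHERE_API_KEY"] raises a KeyError immediately.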
@@ -274,7 +275,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 4,
+"execution_count": 19,
 "metadata": {},
 "outputs": [
 {
@@ -336,24 +337,29 @@
 " response = co.chat(message=message, search_queries_only=True)\n",
 "\n",
 " # If there are search queries, retrieve documents and respond\n",
+" # preamble_override = \"You only answer questions using on the documents you have provided with\"\n",
+" \n",
 " if response.search_queries:\n",
 " print(\"Retrieving information...\")\n",
 "\n",
 " documents = self.retrieve_docs(response)\n",
 "\n",
 " response = co.chat(\n",
 " message=message,\n",
+" # preamble_override = preamble_override,\n",
 " documents=documents,\n",
 " conversation_id=self.conversation_id,\n",
 " stream=True,\n",
 " )\n",
 " for event in response:\n",
 " yield event\n",
+" yield response\n",
 "\n",
 " # If there is no search query, directly respond\n",
 " else:\n",
 " response = co.chat(\n",
-" message=message, \n",
+" message=message,\n",
+" # preamble_override = preamble_override,\n",
 " conversation_id=self.conversation_id, \n",
 " stream=True\n",
 " )\n",
@@ -381,12 +387,6 @@
 " for query in queries:\n",
 " retrieved_docs.extend(self.docs.retrieve(query))\n",
 "\n",
-" # # Uncomment this code block to display the chatbot's retrieved documents\n",
-" # print(\"DOCUMENTS RETRIEVED:\")\n",
-" # for idx, doc in enumerate(retrieved_docs):\n",
-" # print(f\"doc_{idx}: {doc}\")\n",
-" # print(\"\\n\")\n",
-"\n",
 " return retrieved_docs"
 ]
 },
@@ -400,7 +400,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 5,
+"execution_count": 13,
 "metadata": {},
 "outputs": [
 {
@@ -455,18 +455,29 @@
 "\n",
 " # Print the chatbot response\n",
 " print(\"Chatbot:\")\n",
-" flag = False\n",
+" \n",
+" citations_flag = False\n",
+" \n",
 " for event in response:\n",
-" # Text\n",
-" if event.event_type == \"text-generation\":\n",
+" stream_type = type(event).__name__\n",
+" # Text\n",
+" if stream_type == \"StreamTextGeneration\":\n",
 " print(event.text, end=\"\")\n",
 "\n",
 " # Citations\n",
-" if event.event_type == \"citation-generation\":\n",
-" if not flag:\n",
+" if stream_type == \"StreamCitationGeneration\":\n",
+" if not citations_flag:\n",
 " print(\"\\n\\nCITATIONS:\")\n",
-" flag = True\n",
-" print(event.citations)\n",
+" citations_flag = True\n",
+" print(event.citations[0])\n",
+" \n",
+" if citations_flag:\n",
+" if stream_type == \"StreamingChat\":\n",
+" print(\"\\n\\nDOCUMENTS:\")\n",
+" documents = [{'id': doc['id'], 'text': doc['text'][:50] + '...', 'title': doc['title'], 'url': doc['url']} \n",
+" for doc in event.documents]\n",
+" for doc in documents:\n",
+" print(doc)\n",
 "\n",
 " print(f\"\\n{'-'*100}\\n\")"
 ]
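Note on the hunk above: the event loop now dispatches on the event's class name instead of event.event_type, prints each citation object as it arrives, and adds a DOCUMENTS summary taken from the final StreamingChat event (which reaches the loop because the generator now ends with yield response, per the earlier hunk). As a standalone consumer, using only the class names and fields visible in this hunk, the logic is roughly:

def print_stream(response):
    # response is the generator returned by the chatbot's streaming method
    citations_flag = False

    for event in response:
        stream_type = type(event).__name__

        # Generated text arrives incrementally
        if stream_type == "StreamTextGeneration":
            print(event.text, end="")

        # Citation events arrive once the cited spans are known
        if stream_type == "StreamCitationGeneration":
            if not citations_flag:
                print("\n\nCITATIONS:")
                citations_flag = True
            print(event.citations[0])

        # The stream object itself comes last and carries the document list
        if citations_flag and stream_type == "StreamingChat":
            print("\n\nDOCUMENTS:")
            for doc in event.documents:
                print({"id": doc["id"],
                       "text": doc["text"][:50] + "...",
                       "title": doc["title"],
                       "url": doc["url"]})

    print(f"\n{'-'*100}\n")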
@@ -534,7 +545,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 9,
+"execution_count": 8,
 "metadata": {},
 "outputs": [
 {
@@ -581,7 +592,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 15,
+"execution_count": 27,
 "metadata": {},
 "outputs": [
 {
@@ -606,69 +617,69 @@
 "name": "stdout",
 "output_type": "stream",
 "text": [
-"User: Hi there\n",
+"User: Hello, I have a question\n",
 "Chatbot:\n",
-"Hi there! I'm Coral, an AI-assistant chatbot trained to assist human users by providing thorough responses. Is there anything I can help you with today?\n",
+"Hello there! I'm happy to help with any questions or discussions you have in mind today. Go ahead and ask away, and I'll do my best to provide helpful, informative responses.\n",
 "----------------------------------------------------------------------------------------------------\n",
 "\n",
-"User: What are text embeddings\n",
+"User: What’s the difference between word and sentence embeddings\n",
 "Chatbot:\n",
 "Retrieving information...\n",
-"Text embeddings are used to convert words into numbers, creating a vector of numerical data for every piece of text. If the vectors for two pieces of text are similar, this means that the corresponding pieces of text are similar too, and vice versa. Text embeddings are particularly useful for tasks like machine translation and searching for text in different languages. \n",
+"Word embeddings and sentence embeddings are both responsible for translating human language (words) into computer language (numbers).\n",
 "\n",
-"Would you like me to go into more detail about any of the information mentioned above?\n",
+"Word embeddings associate words with lists of numbers (vectors) in a way that similar words are grouped close together. Sentence embeddings do the same thing but for sentences, where similar sentences are grouped closer together.\n",
 "\n",
 "CITATIONS:\n",
-"[{'start': 28, 'end': 54, 'text': 'convert words into numbers', 'document_ids': ['doc_1']}]\n",
-"[{'start': 67, 'end': 116, 'text': 'vector of numerical data for every piece of text.', 'document_ids': ['doc_1']}]\n",
-"[{'start': 136, 'end': 166, 'text': 'two pieces of text are similar', 'document_ids': ['doc_1']}]\n",
-"[{'start': 188, 'end': 249, 'text': 'corresponding pieces of text are similar too, and vice versa.', 'document_ids': ['doc_1']}]\n",
-"[{'start': 305, 'end': 324, 'text': 'machine translation', 'document_ids': ['doc_2']}]\n",
-"[{'start': 329, 'end': 371, 'text': 'searching for text in different languages.', 'document_ids': ['doc_2']}]\n",
+"{'start': 0, 'end': 15, 'text': 'Word embeddings', 'document_ids': ['doc_0', 'doc_1', 'doc_2']}\n",
+"{'start': 20, 'end': 39, 'text': 'sentence embeddings', 'document_ids': ['doc_0', 'doc_1', 'doc_2']}\n",
+"{'start': 65, 'end': 132, 'text': 'translating human language (words) into computer language (numbers)', 'document_ids': ['doc_2']}\n",
+"{'start': 135, 'end': 254, 'text': 'Word embeddings associate words with lists of numbers (vectors) in a way that similar words are grouped close together.', 'document_ids': ['doc_0']}\n",
+"{'start': 255, 'end': 310, 'text': 'Sentence embeddings do the same thing but for sentences', 'document_ids': ['doc_0', 'doc_1']}\n",
+"{'start': 318, 'end': 364, 'text': 'similar sentences are grouped closer together.', 'document_ids': ['doc_1']}\n",
+"\n",
+"\n",
+"DOCUMENTS:\n",
+"{'id': 'doc_0', 'text': 'In the previous chapters, you learned about word a...', 'title': 'The Attention Mechanism', 'url': 'https://docs.cohere.com/docs/the-attention-mechanism'}\n",
+"{'id': 'doc_1', 'text': 'This is where sentence embeddings come into play. ...', 'title': 'Text Embeddings', 'url': 'https://docs.cohere.com/docs/text-embeddings'}\n",
+"{'id': 'doc_2', 'text': 'Conclusion\\n\\nWord and sentence embeddings are the b...', 'title': 'Text Embeddings', 'url': 'https://docs.cohere.com/docs/text-embeddings'}\n",
 "\n",
 "----------------------------------------------------------------------------------------------------\n",
 "\n",
-"User: What are they useful for\n",
+"User: And what are their similarities\n",
 "Chatbot:\n",
 "Retrieving information...\n",
-"Text embeddings are useful for a variety of tasks, including:\n",
+"The similarities between word and sentence embeddings are that they both rely on vector representations of numerical values, and they both allow for calculations of similarity. Word embeddings focus on the similarity between individual words, whereas sentence embeddings compare entire sentences. \n",
 "\n",
-"- Machine learning - for example, transformer models can be used to write stories, essays and poems, as well as answer questions and chat with humans.\n",
-"- Machine translation - text embeddings can translate text from one language to another.\n",
-"- Searching for text - text embeddings can be used to find text in any language. \n",
-"\n",
-"Would you like me to go into more detail about any of the tasks text embeddings are useful for?\n",
+"The similarities between sentences can be calculated using cosine similarity, which is also the case for word embeddings. The similarity between each sentence and itself is always the highest (around 8000 for cosine similarity), while the similarity between different sentences is much lower.\n",
 "\n",
 "CITATIONS:\n",
-"[{'start': 65, 'end': 81, 'text': 'Machine learning', 'document_ids': ['doc_1']}]\n",
-"[{'start': 97, 'end': 115, 'text': 'transformer models', 'document_ids': ['doc_0', 'doc_1']}]\n",
-"[{'start': 131, 'end': 144, 'text': 'write stories', 'document_ids': ['doc_0', 'doc_1']}]\n",
-"[{'start': 146, 'end': 152, 'text': 'essays', 'document_ids': ['doc_1']}]\n",
-"[{'start': 157, 'end': 162, 'text': 'poems', 'document_ids': ['doc_0', 'doc_1']}]\n",
-"[{'start': 175, 'end': 191, 'text': 'answer questions', 'document_ids': ['doc_1']}]\n",
-"[{'start': 196, 'end': 213, 'text': 'chat with humans.', 'document_ids': ['doc_1']}]\n",
-"[{'start': 216, 'end': 235, 'text': 'Machine translation', 'document_ids': ['doc_1']}]\n",
-"[{'start': 258, 'end': 302, 'text': 'translate text from one language to another.', 'document_ids': ['doc_1']}]\n",
-"[{'start': 305, 'end': 323, 'text': 'Searching for text', 'document_ids': ['doc_1']}]\n",
-"[{'start': 370, 'end': 383, 'text': 'any language.', 'document_ids': ['doc_1']}]\n",
+"{'start': 73, 'end': 123, 'text': 'rely on vector representations of numerical values', 'document_ids': ['doc_2']}\n",
+"{'start': 134, 'end': 176, 'text': 'both allow for calculations of similarity.', 'document_ids': ['doc_0', 'doc_1', 'doc_3', 'doc_4', 'doc_5']}\n",
+"{'start': 177, 'end': 241, 'text': 'Word embeddings focus on the similarity between individual words', 'document_ids': ['doc_0', 'doc_1', 'doc_3', 'doc_4', 'doc_5']}\n",
+"{'start': 251, 'end': 296, 'text': 'sentence embeddings compare entire sentences.', 'document_ids': ['doc_0', 'doc_1', 'doc_3', 'doc_4', 'doc_5']}\n",
+"{'start': 303, 'end': 375, 'text': 'similarities between sentences can be calculated using cosine similarity', 'document_ids': ['doc_0', 'doc_1', 'doc_3', 'doc_4', 'doc_5']}\n",
+"{'start': 404, 'end': 420, 'text': 'word embeddings.', 'document_ids': ['doc_0', 'doc_1', 'doc_3', 'doc_4', 'doc_5']}\n",
+"{'start': 425, 'end': 490, 'text': 'similarity between each sentence and itself is always the highest', 'document_ids': ['doc_5']}\n",
+"{'start': 491, 'end': 526, 'text': '(around 8000 for cosine similarity)', 'document_ids': ['doc_1', 'doc_3', 'doc_5']}\n",
+"{'start': 538, 'end': 591, 'text': 'similarity between different sentences is much lower.', 'document_ids': ['doc_0', 'doc_1', 'doc_3', 'doc_4']}\n",
+"\n",
+"\n",
+"DOCUMENTS:\n",
+"{'id': 'doc_2', 'text': 'One would expect the two first sentences to have a...', 'title': 'Similarity Between Words and Sentences', 'url': 'https://docs.cohere.com/docs/similarity-between-words-and-sentences'}\n",
+"{'id': 'doc_0', 'text': 'And the results are:\\n\\nThe similarity between sente...', 'title': 'Similarity Between Words and Sentences', 'url': 'https://docs.cohere.com/docs/similarity-between-words-and-sentences'}\n",
+"{'id': 'doc_1', 'text': 'This checks out as well! The similarity between se...', 'title': 'Similarity Between Words and Sentences', 'url': 'https://docs.cohere.com/docs/similarity-between-words-and-sentences'}\n",
+"{'id': 'doc_3', 'text': 'This checks out as well! The similarity between se...', 'title': 'Similarity Between Words and Sentences', 'url': 'https://docs.cohere.com/docs/similarity-between-words-and-sentences'}\n",
+"{'id': 'doc_4', 'text': 'And the results are:\\n\\nThe similarity between sente...', 'title': 'Similarity Between Words and Sentences', 'url': 'https://docs.cohere.com/docs/similarity-between-words-and-sentences'}\n",
+"{'id': 'doc_5', 'text': 'Just for consistency, let’s calculate the similari...', 'title': 'Similarity Between Words and Sentences', 'url': 'https://docs.cohere.com/docs/similarity-between-words-and-sentences'}\n",
 "\n",
 "----------------------------------------------------------------------------------------------------\n",
 "\n",
-"User: How do you generate them\n",
+"User: What do you know about graph neural networks\n",
 "Chatbot:\n",
 "Retrieving information...\n",
-"Text embeddings are generated by training transformer models on large datasets, such as the entire internet or large datasets of conversations. Post-training helps improve the model's performance on specific tasks by focusing on datasets corresponding to questions and answers or conversations. \n",
-"\n",
-"Would you like me to go into more detail about transformer models?\n",
-"\n",
-"CITATIONS:\n",
-"[{'start': 42, 'end': 60, 'text': 'transformer models', 'document_ids': ['doc_0', 'doc_1', 'doc_2']}]\n",
-"[{'start': 92, 'end': 107, 'text': 'entire internet', 'document_ids': ['doc_0']}]\n",
-"[{'start': 129, 'end': 143, 'text': 'conversations.', 'document_ids': ['doc_1']}]\n",
-"[{'start': 144, 'end': 195, 'text': \"Post-training helps improve the model's performance\", 'document_ids': ['doc_0', 'doc_1']}]\n",
-"[{'start': 255, 'end': 276, 'text': 'questions and answers', 'document_ids': ['doc_0']}]\n",
-"[{'start': 280, 'end': 294, 'text': 'conversations.', 'document_ids': ['doc_1']}]\n",
+"Graph neural networks are a newer concept in the world of neural networks. Using graph neural networks, programmers can develop models that analyze datasets comprised of pairs of entities and edges between those entities. These edges convey relationships between the entities, such as a connection between two entities or a similarity between entities. \n",
 "\n",
+"To construct graph neural networks, programmers use node embedding, a process that assigns a vector to each node in the graph. The vectors are designed so that their underlying information is preserved when compared to the original graph.\n",
 "----------------------------------------------------------------------------------------------------\n",
 "\n",
 "Ending chat.\n"
