Commit bbd17a2

Merge pull request #35 from jcodella/main
Updated CosmosDB for MongoDB vCore notebooks...
2 parents 4b6945d + 936807b commit bbd17a2

File tree

3 files changed (+347, -71 lines)

Python/CosmosDB-MongoDB-vCore/CosmosDB-MongoDB-vCore_AzureOpenAI_Tutorial.ipynb

Lines changed: 142 additions & 61 deletions
@@ -30,8 +30,7 @@
 "! pip install pymongo\n",
 "! pip install python-dotenv\n",
 "! pip install azure-core\n",
-"! pip install azure-cosmos\n",
-"! pip install tenacity"
+"! pip install azure-cosmos"
 ]
 },
 {
@@ -43,14 +42,14 @@
 "import json\n",
 "import datetime\n",
 "import time\n",
+"import urllib \n",
 "\n",
 "from azure.core.exceptions import AzureError\n",
 "from azure.core.credentials import AzureKeyCredential\n",
 "import pymongo\n",
 "\n",
-"import openai\n",
-"from dotenv import load_dotenv\n",
-"from tenacity import retry, wait_random_exponential, stop_after_attempt"
+"from openai import AzureOpenAI\n",
+"from dotenv import load_dotenv"
 ]
 },
 {
@@ -73,25 +72,18 @@
 "env_name = \"example.env\" # following example.env template change to your own .env file name\n",
 "config = dotenv_values(env_name)\n",
 "\n",
-"cosmosdb_endpoint = config['cosmos_db_api_endpoint']\n",
-"cosmosdb_key = config['cosmos_db_api_key']\n",
-"cosmosdb_connection_str = config['cosmos_db_connection_string']\n",
-"\n",
 "COSMOS_MONGO_USER = config['cosmos_db_mongo_user']\n",
 "COSMOS_MONGO_PWD = config['cosmos_db_mongo_pwd']\n",
 "COSMOS_MONGO_SERVER = config['cosmos_db_mongo_server']\n",
 "\n",
-"openai.api_type = config['openai_api_type']\n",
-"openai.api_key = config['openai_api_key']\n",
-"openai.api_base = config['openai_api_endpoint']\n",
-"openai.api_version = config['openai_api_version']\n",
-"embeddings_deployment = config['openai_embeddings_deployment']\n",
-"completions_deployment = config['openai_completions_deployment']"
+"AOAI_client = AzureOpenAI(api_key=config['openai_api_key'], azure_endpoint=config['openai_api_endpoint'], api_version=config['openai_api_version'],)"
 ]
 },
 {
 "cell_type": "markdown",
-"metadata": {},
+"metadata": {
+"jp-MarkdownHeadingCollapsed": true
+},
 "source": [
 "## Create an Azure Cosmos DB for MongoDB vCore resource<a class=\"anchor\" id=\"cosmosdb\"></a>\n",
 "Let's start by creating an Azure Cosmos DB for MongoDB vCore Resource following this quick start guide: https://learn.microsoft.com/en-us/azure/cosmos-db/mongodb/vcore/quickstart-portal\n",
@@ -128,11 +120,12 @@
 "metadata": {},
 "outputs": [],
 "source": [
-"# Load text-sample.json data file. Embeddings will need to be generated using the function below.\n",
-"#data_file = open(file=\"../../DataSet/AzureServices/text-sample.json\", mode=\"r\")\n",
-"\n",
-"# OR Load text-sample_w_embeddings.json which has embeddings pre-computed\n",
+"# Load text-sample_w_embeddings.json which has embeddings pre-computed\n",
 "data_file = open(file=\"../../DataSet/AzureServices/text-sample_w_embeddings.json\", mode=\"r\") \n",
+"\n",
+"# OR Load text-sample.json data file. Embeddings will need to be generated using the function below.\n",
+"# data_file = open(file=\"../../DataSet/AzureServices/text-sample.json\", mode=\"r\")\n",
+"\n",
 "data = json.load(data_file)\n",
 "data_file.close()"
 ]
@@ -155,17 +148,15 @@
 "metadata": {},
 "outputs": [],
 "source": [
-"@retry(wait=wait_random_exponential(min=1, max=20), stop=stop_after_attempt(10))\n",
 "def generate_embeddings(text):\n",
 " '''\n",
 " Generate embeddings from string of text.\n",
 " This will be used to vectorize data and user input for interactions with Azure OpenAI.\n",
 " '''\n",
-" response = openai.Embedding.create(\n",
-" input=text, engine=\"text-embedding-ada-002\")\n",
-" embeddings = response['data'][0]['embedding']\n",
-" time.sleep(0.5) # rest period to avoid rate limiting on AOAI for free tier\n",
-" return embeddings"
+" response = AOAI_client.embeddings.create(input=text, model=config['openai_embeddings_deployment'])\n",
+" embeddings =response.model_dump()\n",
+" time.sleep(0.5) \n",
+" return embeddings['data'][0]['embedding']"
 ]
 },
 {
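The rewritten generate_embeddings drops the tenacity @retry decorator and calls the new client directly, then pulls the vector out of model_dump(). A sketch of an equivalent form using the 1.x response object's attribute access (not part of the commit; the deployment name still comes from the notebook's config):

```python
import time

def generate_embeddings(text):
    # embeddings.create returns a typed response; data[0].embedding is the vector itself
    response = AOAI_client.embeddings.create(
        input=text,
        model=config['openai_embeddings_deployment'],
    )
    time.sleep(0.5)  # crude pacing, since the tenacity retry logic was removed
    return response.data[0].embedding
```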
@@ -191,6 +182,16 @@
 " json.dump(data, f)"
 ]
 },
+{
+"cell_type": "code",
+"execution_count": null,
+"metadata": {},
+"outputs": [],
+"source": [
+"# Take a peek at one data item with embeddings created\n",
+"print(json.dumps(data[0], indent=2))"
+]
+},
 {
 "cell_type": "markdown",
 "metadata": {},
@@ -211,7 +212,7 @@
 "metadata": {},
 "outputs": [],
 "source": [
-"mongo_conn = \"mongodb+srv://\"+COSMOS_MONGO_USER+\":\"+COSMOS_MONGO_PWD+\"@\"+COSMOS_MONGO_SERVER+\"?tls=true&authMechanism=SCRAM-SHA-256&retrywrites=false&maxIdleTimeMS=120000\"\n",
+"mongo_conn = \"mongodb+srv://\"+urllib.parse.quote(COSMOS_MONGO_USER)+\":\"+urllib.parse.quote(COSMOS_MONGO_PWD)+\"@\"+COSMOS_MONGO_SERVER+\"?tls=true&authMechanism=SCRAM-SHA-256&retrywrites=false&maxIdleTimeMS=120000\"\n",
 "mongo_client = pymongo.MongoClient(mongo_conn)"
 ]
 },
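Wrapping the username and password in urllib.parse.quote percent-encodes characters that are reserved in a MongoDB connection URI, such as '@' and ':', which would otherwise split the string in the wrong place. A small illustration with made-up credentials (placeholders, not values from the notebook):

```python
import urllib.parse

user = "exampleUser"   # hypothetical credentials for illustration only
pwd = "p@ss:w0rd!"

print(urllib.parse.quote(pwd))  # -> p%40ss%3Aw0rd%21

mongo_conn = (
    "mongodb+srv://" + urllib.parse.quote(user) + ":" + urllib.parse.quote(pwd)
    + "@" + "example.mongocluster.cosmos.azure.com"  # placeholder server name
    + "?tls=true&authMechanism=SCRAM-SHA-256&retrywrites=false&maxIdleTimeMS=120000"
)
```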
@@ -250,8 +251,8 @@
 "metadata": {},
 "outputs": [],
 "source": [
-"## Use only if re-reunning code and want to reset db and collection\n",
-"collection.drop_index(\"VectorSearchIndex\")\n",
+"# Use only if re-running code and want to reset db and collection\n",
+"collection.drop_indexes()\n",
 "mongo_client.drop_database(\"ExampleDB\")"
 ]
 },
@@ -268,8 +269,10 @@
 "cell_type": "markdown",
 "metadata": {},
 "source": [
-"### IVF\n",
-"IVF is the default vector indexing algorithm, which works on all cluster tiers. It's an approximate nerarest neighbors (ANN) approach that uses clustering to speeding up the search for similar vectors in a dataset. "
+"### IVF index\n",
+"IVF is an approximate nearest neighbors (ANN) approach that uses clustering to speed up the search for similar vectors in a dataset. It's a good choice for proofs of concept and smaller datasets (under a few thousand documents). However, it's not recommended at scale or when higher throughput is needed.\n",
+"\n",
+"IVF is supported on all cluster tiers, including the free tier. "
 ]
 },
 {
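The IVF index itself is created with the same createIndexes command the notebook uses for HNSW below, only with IVF-specific cosmosSearchOptions. A hedged sketch, assuming the ExampleCollection/contentVector names used elsewhere in the notebook and 1536-dimensional text-embedding-ada-002 vectors:

```python
# db is the pymongo Database handle created earlier in the notebook
db.command({
    "createIndexes": "ExampleCollection",
    "indexes": [
        {
            "name": "VectorSearchIndex",
            "key": {"contentVector": "cosmosSearch"},
            "cosmosSearchOptions": {
                "kind": "vector-ivf",  # IVF index type
                "numLists": 1,         # number of clusters; tune upward for larger datasets
                "similarity": "COS",   # cosine similarity
                "dimensions": 1536     # ada-002 embedding size
            }
        }
    ]
})
```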
@@ -301,11 +304,9 @@
 "cell_type": "markdown",
 "metadata": {},
 "source": [
-"### HNSW (preview)\n",
-"\n",
-"HNSW stands for Hierarchical Navigable Small World, a graph-based data structure that partitions vectors into clusters and subclusters. With HNSW, you can perform fast approximate nearest neighbor search at higher speeds with greater accuracy. HNSW is an approximate (ANN) method. As a preview feature, this must be enabled using Azure Feature Enablement Control (AFEC) by selecting the \"mongoHnswIndex\" feature. For more information, see [enable preview features](https://learn.microsoft.com/azure/azure-resource-manager/management/preview-features).\n",
+"### HNSW Index\n",
 "\n",
-"HNSW works on M50 cluster tiers and higher while in preview."
+"HNSW stands for Hierarchical Navigable Small World, a graph-based index that partitions vectors into clusters and subclusters. With HNSW, you can perform fast approximate nearest neighbor search at higher speeds with greater accuracy. HNSW is now available on M40 and higher cluster tiers."
 ]
 },
 {
@@ -314,8 +315,7 @@
 "metadata": {},
 "outputs": [],
 "source": [
-"db.command(\n",
-"{ \n",
+"db.command({ \n",
 " \"createIndexes\": \"ExampleCollection\",\n",
 " \"indexes\": [\n",
 " {\n",
@@ -367,7 +367,7 @@
 "outputs": [],
 "source": [
 "# Simple function to assist with vector search\n",
-"def vector_search(query, num_results=3):\n",
+"def vector_search(query, num_results=5):\n",
 " query_embedding = generate_embeddings(query)\n",
 " embeddings_list = []\n",
 " pipeline = [\n",
@@ -376,7 +376,8 @@
 " \"cosmosSearch\": {\n",
 " \"vector\": query_embedding,\n",
 " \"path\": \"contentVector\",\n",
-" \"k\": num_results #, \"efsearch\": 40 # optional for HNSW only \n",
+" \"k\": num_results #, \"efsearch\": 40 # optional for HNSW only \n",
+" #\"filter\": {\"title\": {\"$ne\": \"Azure Cosmos DB\"}}\n",
 " },\n",
 " \"returnStoredSource\": True }},\n",
 " {'$project': { 'similarityScore': { '$meta': 'searchScore' }, 'document' : '$$ROOT' } }\n",
@@ -400,7 +401,7 @@
 },
 "outputs": [],
 "source": [
-"query = \"What are the services for running ML models?\"\n",
+"query = \"What are some NoSQL databases in Azure?\"#\"What are the services for running ML models?\"\n",
 "results = vector_search(query)\n",
 "for result in results: \n",
 "# print(result)\n",
@@ -410,6 +411,89 @@
 " print(f\"Category: {result['document']['category']}\\n\") "
 ]
 },
+{
+"cell_type": "markdown",
+"metadata": {},
+"source": [
+"## Filtered vector search (Preview)\n",
+"You can add additional query filters to your vector search by creating a filtered index and specifying it in the search pipeline.\n",
+"\n",
+"**Note:** filtered vector search is in preview and needs to be enabled via Azure Preview Features for your subscription. Search for the preview feature \"filtering on vector search\". Learn more about it here: https://learn.microsoft.com/azure/azure-resource-manager/management/preview-features?tabs=azure-portal"
+]
+},
+{
+"cell_type": "code",
+"execution_count": null,
+"metadata": {},
+"outputs": [],
+"source": [
+"# Add a filter index\n",
+"db.command( {\n",
+" \"createIndexes\": \"ExampleCollection\",\n",
+" \"indexes\": [ {\n",
+" \"key\": { \n",
+" \"title\": 1 \n",
+" }, \n",
+" \"name\": \"title_filter\" \n",
+" }\n",
+" ] \n",
+"} \n",
+")"
+]
+},
+{
+"cell_type": "code",
+"execution_count": null,
+"metadata": {},
+"outputs": [],
+"source": [
+"# Verify all indexes are present\n",
+"for i in collection.list_indexes():\n",
+" print(i)"
+]
+},
+{
+"cell_type": "code",
+"execution_count": null,
+"metadata": {},
+"outputs": [],
+"source": [
+"# Simple function to assist with vector search\n",
+"def filtered_vector_search(query, num_results=5):\n",
+" query_embedding = generate_embeddings(query)\n",
+" embeddings_list = []\n",
+" pipeline = [\n",
+" {\n",
+" '$search': {\n",
+" \"cosmosSearch\": {\n",
+" \"vector\": query_embedding,\n",
+" \"path\": \"contentVector\",\n",
+" \"k\": num_results,\n",
+" \"filter\": {\"title\": {\"$nin\": [\"Azure SQL Database\", \"Azure Database for MySQL\"]}}\n",
+" },\n",
+" \"returnStoredSource\": True }},\n",
+" {'$project': { 'similarityScore': { '$meta': 'searchScore' }, 'document' : '$$ROOT' } }\n",
+" ]\n",
+" results = collection.aggregate(pipeline)\n",
+" return results"
+]
+},
+{
+"cell_type": "code",
+"execution_count": null,
+"metadata": {},
+"outputs": [],
+"source": [
+"query = \"What are some NoSQL databases in Azure?\"#\"What are the services for running ML models?\"\n",
+"results = filtered_vector_search(query)\n",
+"for result in results: \n",
+"# print(result)\n",
+" print(f\"Similarity Score: {result['similarityScore']}\") \n",
+" print(f\"Title: {result['document']['title']}\") \n",
+" print(f\"Content: {result['document']['content']}\") \n",
+" print(f\"Category: {result['document']['category']}\\n\") "
+]
+},
 {
 "cell_type": "markdown",
 "metadata": {},
@@ -427,47 +511,44 @@
 "source": [
 "#This function helps to ground the model with prompts and system instructions.\n",
 "\n",
-"def generate_completion(prompt):\n",
+"def generate_completion(vector_search_results, user_prompt):\n",
 " system_prompt = '''\n",
 " You are an intelligent assistant for Microsoft Azure services.\n",
 " You are designed to provide helpful answers to user questions about Azure services given the information about to be provided.\n",
-" - Only answer questions related to the information provided below, provide 3 clear suggestions in a list format.\n",
+" - Only answer questions related to the information provided below, provide at least 3 clear suggestions in a list format.\n",
 " - Write two lines of whitespace between each answer in the list.\n",
-" - Only provide answers that have products that are part of Microsoft Azure.\n",
 " - If you're unsure of an answer, you can say \"\"I don't know\"\" or \"\"I'm not sure\"\" and recommend users search themselves.\"\n",
+" - Only provide answers that have products that are part of Microsoft Azure and part of these following prompts.\n",
 " '''\n",
 "\n",
-" messages=[\n",
-" {\"role\": \"system\", \"content\": system_prompt},\n",
-" {\"role\": \"user\", \"content\": user_input},\n",
-" ]\n",
-"\n",
-" for item in results:\n",
-" messages.append({\"role\": \"system\", \"content\": prompt['content']})\n",
-"\n",
-" response = openai.ChatCompletion.create(engine=completions_deployment, messages=messages)\n",
+" messages=[{\"role\": \"system\", \"content\": system_prompt}]\n",
+" for item in vector_search_results:\n",
+" messages.append({\"role\": \"system\", \"content\": item['document']['content']})\n",
+" messages.append({\"role\": \"user\", \"content\": user_prompt})\n",
+" response = AOAI_client.chat.completions.create(model=config['openai_completions_deployment'], messages=messages,temperature=0)\n",
 " \n",
-" return response"
+" return response.dict()"
 ]
 },
 {
 "cell_type": "code",
 "execution_count": null,
-"metadata": {},
+"metadata": {
+"scrolled": true
+},
 "outputs": [],
 "source": [
 "# Create a loop of user input and model output. You can now perform Q&A over the sample data!\n",
 "\n",
 "user_input = \"\"\n",
 "print(\"*** Please ask your model questions about Azure services. Type 'end' to end the session.\\n\")\n",
-"user_input = input(\"Prompt: \")\n",
+"user_input = input(\"User prompt: \")\n",
 "while user_input.lower() != \"end\":\n",
-" results_for_prompt = vector_search(user_input)\n",
-" # print(f\"User Prompt: {user_input}\")\n",
-" completions_results = generate_completion(results_for_prompt)\n",
+" search_results = vector_search(user_input)\n",
+" completions_results = generate_completion(search_results, user_input)\n",
 " print(\"\\n\")\n",
 " print(completions_results['choices'][0]['message']['content'])\n",
-" user_input = input(\"Prompt: \")\n"
+" user_input = input(\"User prompt: \")"
 ]
 }
 ],
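generate_completion now returns response.dict(), which is why the chat loop can keep indexing into ['choices'][0]['message']['content'] even though the 1.x SDK returns a typed object. An equivalent attribute-style sketch, in case the dict conversion is ever dropped (an alternative, not what the commit does):

```python
response = AOAI_client.chat.completions.create(
    model=config['openai_completions_deployment'],
    messages=messages,
    temperature=0,
)
# Typed access on the openai>=1.0 response object
answer = response.choices[0].message.content
print(answer)
```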
@@ -487,7 +568,7 @@
 "name": "python",
 "nbconvert_exporter": "python",
 "pygments_lexer": "ipython3",
-"version": "3.9.7"
+"version": "3.11.0"
 },
 "varInspector": {
 "cols": {
@@ -520,5 +601,5 @@
 }
 },
 "nbformat": 4,
-"nbformat_minor": 2
+"nbformat_minor": 4
 }
