diff --git a/docs/langchain-retrieval-augmentation.ipynb b/docs/langchain-retrieval-augmentation.ipynb
index 3b5317ad..c483e470 100644
--- a/docs/langchain-retrieval-augmentation.ipynb
+++ b/docs/langchain-retrieval-augmentation.ipynb
@@ -182,7 +182,7 @@
"text": [
"Document content: Released [`v2.2.0`](https://github.com/pinecone-io/go-pinecone/releases/tag/v2.2.0) of the [Pinecone Go SDK](/reference/go-sdk). This version adds support for [index tags](/guides/manage-data/manage-indexes#configure-index-tags) when creating or configuring indexes.\n",
"\n",
- "Document metadata: {'release': '2025 releases', 'month_year': 'January 2025', 'feature': 'Released Go SDK v2.2.0', 'source': 'https://docs.pinecone.io/release-notes/2025.md', 'chunk_num': 47}\n"
+ "Document metadata: {'release': '2025 releases', 'month_year': 'January 2025', 'feature': 'Released Go SDK v2.2.0', 'source': 'https://docs.pinecone.io/release-notes/2025.md', 'chunk_num': 61}\n"
]
}
],
@@ -313,16 +313,7 @@
"cell_type": "code",
"execution_count": 9,
"metadata": {},
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "/opt/miniconda3/envs/pinecone-examples/lib/python3.11/site-packages/pinecone/data/index.py:1: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
- " from tqdm.autonotebook import tqdm\n"
- ]
- }
- ],
+ "outputs": [],
"source": [
"from pinecone import Pinecone\n",
"\n",
@@ -394,7 +385,7 @@
},
{
"cell_type": "code",
- "execution_count": 17,
+ "execution_count": 11,
"metadata": {},
"outputs": [
{
@@ -599,242 +590,310 @@
" 'source': 'https://docs.pinecone.io/release-notes/2024.md',\n",
" 'chunk_num': 41},\n",
" {'release': '2025 releases',\n",
- " 'month_year': 'June 2025',\n",
+ " 'month_year': 'August 2025',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
" 'chunk_num': 0},\n",
" {'release': '2025 releases',\n",
+ " 'month_year': 'August 2025',\n",
+ " 'feature': 'Data import from Azure Blob Storage',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 1},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'August 2025',\n",
+ " 'feature': 'Assistant MCP server endpoint update',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 2},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'August 2025',\n",
+ " 'feature': 'VoltAgent integration',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 3},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'July 2025',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 4},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'July 2025',\n",
+ " 'feature': 'Increased context window for `pinecone-sparse-english-v0`',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 5},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'July 2025',\n",
+ " 'feature': 'Release Go SDK v4.1.0, v4.1.1, and v4.1.2',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 6},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'July 2025',\n",
+ " 'feature': 'Release Node.js SDK v6.1.2',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 7},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'June 2025',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 8},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'June 2025',\n",
+ " 'feature': 'Unlimited assistant file storage for paid plans',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 9},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'June 2025',\n",
+ " 'feature': 'Data import from Google Cloud Storage',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 10},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'June 2025',\n",
+ " 'feature': 'Released Python SDK v7.1.0, v7.2.0, and v7.3.0',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 11},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'June 2025',\n",
+ " 'feature': 'Released Go SDK v4.0.0 and v4.0.1',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 12},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'June 2025',\n",
+ " 'feature': 'Released Node.js SDK v6.1.1',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 13},\n",
+ " {'release': '2025 releases',\n",
+ " 'month_year': 'June 2025',\n",
+ " 'feature': 'Data modeling guide',\n",
+ " 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
+ " 'chunk_num': 14},\n",
+ " {'release': '2025 releases',\n",
" 'month_year': 'June 2025',\n",
" 'feature': 'Released Java SDK v5.1.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 1},\n",
+ " 'chunk_num': 15},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'June 2025',\n",
" 'feature': 'Released Node.js SDK v6.1.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 2},\n",
+ " 'chunk_num': 16},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'May 2025',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 3},\n",
+ " 'chunk_num': 17},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'May 2025',\n",
" 'feature': 'Released Python SDK v7.0.1 and v7.0.2',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 4},\n",
+ " 'chunk_num': 18},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'May 2025',\n",
" 'feature': 'Released Node.s SDK v6.0.1',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 5},\n",
+ " 'chunk_num': 19},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'May 2025',\n",
" 'feature': 'Pinecone API version `2025-04` is now the latest stable version',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 6},\n",
+ " 'chunk_num': 20},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'May 2025',\n",
" 'feature': 'Released Python SDK v7.0.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 7},\n",
+ " 'chunk_num': 21},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'May 2025',\n",
" 'feature': 'Released Node.js SDK v6.0.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 8},\n",
+ " 'chunk_num': 22},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'May 2025',\n",
" 'feature': 'Released Java SDK v5.0.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 9},\n",
+ " 'chunk_num': 23},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'May 2025',\n",
" 'feature': 'Released .NET SDK v4.0.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 10},\n",
+ " 'chunk_num': 24},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'May 2025',\n",
" 'feature': 'New Docs IA',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 11},\n",
+ " 'chunk_num': 25},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'April 2025',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 12},\n",
+ " 'chunk_num': 26},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'April 2025',\n",
" 'feature': 'Bring Your Own Cloud (BYOC) in GCP',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 13},\n",
+ " 'chunk_num': 27},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'April 2025',\n",
" 'feature': 'Integrate AI agents with Pinecone MCP',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 14},\n",
+ " 'chunk_num': 28},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'April 2025',\n",
" 'feature': 'Add context to AI agents with Assistant MCP',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 15},\n",
+ " 'chunk_num': 29},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'April 2025',\n",
" 'feature': 'Upload a file from an in-memory binary stream',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 16},\n",
+ " 'chunk_num': 30},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'April 2025',\n",
" 'feature': 'Released Pinecone Terraform Provider v1.0.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 17},\n",
+ " 'chunk_num': 31},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'April 2025',\n",
" 'feature': 'Released .NET SDK v3.1.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 18},\n",
+ " 'chunk_num': 32},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'April 2025',\n",
" 'feature': 'LLM shortcuts for Pinecone docs',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 19},\n",
+ " 'chunk_num': 33},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'March 2025',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 20},\n",
+ " 'chunk_num': 34},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'March 2025',\n",
" 'feature': 'Control the context snippets the assistant sends to the LLM',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 21},\n",
+ " 'chunk_num': 35},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'March 2025',\n",
" 'feature': 'Released Go SDK v3.1.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 22},\n",
+ " 'chunk_num': 36},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'March 2025',\n",
" 'feature': 'Launch week: Dark mode',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 23},\n",
+ " 'chunk_num': 37},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'March 2025',\n",
" 'feature': 'Launch week: Self-service audit logs',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 24},\n",
+ " 'chunk_num': 38},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'March 2025',\n",
" 'feature': 'Launch week: Introducing the Admin API and service accounts',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 25},\n",
+ " 'chunk_num': 39},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'March 2025',\n",
" 'feature': 'Launch week: Back up an index through the API',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 26},\n",
+ " 'chunk_num': 40},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'March 2025',\n",
" 'feature': 'Launch week: Optimized database architecture',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 27},\n",
+ " 'chunk_num': 41},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'March 2025',\n",
" 'feature': 'Firebase Genkit integration',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 28},\n",
+ " 'chunk_num': 42},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'March 2025',\n",
" 'feature': 'Bring Your Own Cloud (BYOC) in public preview',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 29},\n",
+ " 'chunk_num': 43},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 30},\n",
+ " 'chunk_num': 44},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'Docs site refresh',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 31},\n",
+ " 'chunk_num': 45},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'Limit the number of chunks retrieved',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 32},\n",
+ " 'chunk_num': 46},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'Assistant Quickstart colab notebook',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 33},\n",
+ " 'chunk_num': 47},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'Released Node.js SDK v5.0.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 34},\n",
+ " 'chunk_num': 48},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'New integrations',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 35},\n",
+ " 'chunk_num': 49},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'Citation highlights in assistant responses',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 36},\n",
+ " 'chunk_num': 50},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'Pinecone API version `2025-01` is now the latest stable version',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 37},\n",
+ " 'chunk_num': 51},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'Released Python SDK v6.0.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 38},\n",
+ " 'chunk_num': 52},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'Released Java SDK v4.0.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 39},\n",
+ " 'chunk_num': 53},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'Released Go SDK v3.0.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 40},\n",
+ " 'chunk_num': 54},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'February 2025',\n",
" 'feature': 'Released .NET SDK v3.0.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 41},\n",
+ " 'chunk_num': 55},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'January 2025',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 42},\n",
+ " 'chunk_num': 56},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'January 2025',\n",
" 'feature': 'Update to the API keys page',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 43},\n",
+ " 'chunk_num': 57},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'January 2025',\n",
" 'feature': 'Sparse-only indexes in early access',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 44},\n",
+ " 'chunk_num': 58},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'January 2025',\n",
" 'feature': 'Released Node SDK v4.1.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 45},\n",
+ " 'chunk_num': 59},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'January 2025',\n",
" 'feature': 'New Billing Admin user role',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 46},\n",
+ " 'chunk_num': 60},\n",
" {'release': '2025 releases',\n",
" 'month_year': 'January 2025',\n",
" 'feature': 'Released Go SDK v2.2.0',\n",
" 'source': 'https://docs.pinecone.io/release-notes/2025.md',\n",
- " 'chunk_num': 47}]"
+ " 'chunk_num': 61}]"
]
},
- "execution_count": 17,
+ "execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
@@ -845,7 +904,7 @@
},
{
"cell_type": "code",
- "execution_count": 19,
+ "execution_count": 12,
"metadata": {},
"outputs": [
{
@@ -894,56 +953,70 @@
" 'release_2024#feature_na#chunk_num40',\n",
" 'release_2024#feature_na#chunk_num41',\n",
" 'release_2025#feature_na#chunk_num0',\n",
- " 'release_2025#feature_Released Java SDK v5.1.0#chunk_num1',\n",
- " 'release_2025#feature_Released Node.js SDK v6.1.0#chunk_num2',\n",
- " 'release_2025#feature_na#chunk_num3',\n",
- " 'release_2025#feature_Released Python SDK v7.0.1 and v7.0.2#chunk_num4',\n",
- " 'release_2025#feature_Released Node.s SDK v6.0.1#chunk_num5',\n",
- " 'release_2025#feature_Pinecone API version `2025-04` is now the latest stable version#chunk_num6',\n",
- " 'release_2025#feature_Released Python SDK v7.0.0#chunk_num7',\n",
- " 'release_2025#feature_Released Node.js SDK v6.0.0#chunk_num8',\n",
- " 'release_2025#feature_Released Java SDK v5.0.0#chunk_num9',\n",
- " 'release_2025#feature_Released .NET SDK v4.0.0#chunk_num10',\n",
- " 'release_2025#feature_New Docs IA#chunk_num11',\n",
- " 'release_2025#feature_na#chunk_num12',\n",
- " 'release_2025#feature_Bring Your Own Cloud (BYOC) in GCP#chunk_num13',\n",
- " 'release_2025#feature_Integrate AI agents with Pinecone MCP#chunk_num14',\n",
- " 'release_2025#feature_Add context to AI agents with Assistant MCP#chunk_num15',\n",
- " 'release_2025#feature_Upload a file from an in-memory binary stream#chunk_num16',\n",
- " 'release_2025#feature_Released Pinecone Terraform Provider v1.0.0#chunk_num17',\n",
- " 'release_2025#feature_Released .NET SDK v3.1.0#chunk_num18',\n",
- " 'release_2025#feature_LLM shortcuts for Pinecone docs#chunk_num19',\n",
- " 'release_2025#feature_na#chunk_num20',\n",
- " 'release_2025#feature_Control the context snippets the assistant sends to the LLM#chunk_num21',\n",
- " 'release_2025#feature_Released Go SDK v3.1.0#chunk_num22',\n",
- " 'release_2025#feature_Launch week: Dark mode#chunk_num23',\n",
- " 'release_2025#feature_Launch week: Self-service audit logs#chunk_num24',\n",
- " 'release_2025#feature_Launch week: Introducing the Admin API and service accounts#chunk_num25',\n",
- " 'release_2025#feature_Launch week: Back up an index through the API#chunk_num26',\n",
- " 'release_2025#feature_Launch week: Optimized database architecture#chunk_num27',\n",
- " 'release_2025#feature_Firebase Genkit integration#chunk_num28',\n",
- " 'release_2025#feature_Bring Your Own Cloud (BYOC) in public preview#chunk_num29',\n",
- " 'release_2025#feature_na#chunk_num30',\n",
- " 'release_2025#feature_Docs site refresh#chunk_num31',\n",
- " 'release_2025#feature_Limit the number of chunks retrieved#chunk_num32',\n",
- " 'release_2025#feature_Assistant Quickstart colab notebook#chunk_num33',\n",
- " 'release_2025#feature_Released Node.js SDK v5.0.0#chunk_num34',\n",
- " 'release_2025#feature_New integrations#chunk_num35',\n",
- " 'release_2025#feature_Citation highlights in assistant responses#chunk_num36',\n",
- " 'release_2025#feature_Pinecone API version `2025-01` is now the latest stable version#chunk_num37',\n",
- " 'release_2025#feature_Released Python SDK v6.0.0#chunk_num38',\n",
- " 'release_2025#feature_Released Java SDK v4.0.0#chunk_num39',\n",
- " 'release_2025#feature_Released Go SDK v3.0.0#chunk_num40',\n",
- " 'release_2025#feature_Released .NET SDK v3.0.0#chunk_num41',\n",
- " 'release_2025#feature_na#chunk_num42',\n",
- " 'release_2025#feature_Update to the API keys page#chunk_num43',\n",
- " 'release_2025#feature_Sparse-only indexes in early access#chunk_num44',\n",
- " 'release_2025#feature_Released Node SDK v4.1.0#chunk_num45',\n",
- " 'release_2025#feature_New Billing Admin user role#chunk_num46',\n",
- " 'release_2025#feature_Released Go SDK v2.2.0#chunk_num47']"
+ " 'release_2025#feature_Data import from Azure Blob Storage#chunk_num1',\n",
+ " 'release_2025#feature_Assistant MCP server endpoint update#chunk_num2',\n",
+ " 'release_2025#feature_VoltAgent integration#chunk_num3',\n",
+ " 'release_2025#feature_na#chunk_num4',\n",
+ " 'release_2025#feature_Increased context window for `pinecone-sparse-english-v0`#chunk_num5',\n",
+ " 'release_2025#feature_Release Go SDK v4.1.0, v4.1.1, and v4.1.2#chunk_num6',\n",
+ " 'release_2025#feature_Release Node.js SDK v6.1.2#chunk_num7',\n",
+ " 'release_2025#feature_na#chunk_num8',\n",
+ " 'release_2025#feature_Unlimited assistant file storage for paid plans#chunk_num9',\n",
+ " 'release_2025#feature_Data import from Google Cloud Storage#chunk_num10',\n",
+ " 'release_2025#feature_Released Python SDK v7.1.0, v7.2.0, and v7.3.0#chunk_num11',\n",
+ " 'release_2025#feature_Released Go SDK v4.0.0 and v4.0.1#chunk_num12',\n",
+ " 'release_2025#feature_Released Node.js SDK v6.1.1#chunk_num13',\n",
+ " 'release_2025#feature_Data modeling guide#chunk_num14',\n",
+ " 'release_2025#feature_Released Java SDK v5.1.0#chunk_num15',\n",
+ " 'release_2025#feature_Released Node.js SDK v6.1.0#chunk_num16',\n",
+ " 'release_2025#feature_na#chunk_num17',\n",
+ " 'release_2025#feature_Released Python SDK v7.0.1 and v7.0.2#chunk_num18',\n",
+ " 'release_2025#feature_Released Node.s SDK v6.0.1#chunk_num19',\n",
+ " 'release_2025#feature_Pinecone API version `2025-04` is now the latest stable version#chunk_num20',\n",
+ " 'release_2025#feature_Released Python SDK v7.0.0#chunk_num21',\n",
+ " 'release_2025#feature_Released Node.js SDK v6.0.0#chunk_num22',\n",
+ " 'release_2025#feature_Released Java SDK v5.0.0#chunk_num23',\n",
+ " 'release_2025#feature_Released .NET SDK v4.0.0#chunk_num24',\n",
+ " 'release_2025#feature_New Docs IA#chunk_num25',\n",
+ " 'release_2025#feature_na#chunk_num26',\n",
+ " 'release_2025#feature_Bring Your Own Cloud (BYOC) in GCP#chunk_num27',\n",
+ " 'release_2025#feature_Integrate AI agents with Pinecone MCP#chunk_num28',\n",
+ " 'release_2025#feature_Add context to AI agents with Assistant MCP#chunk_num29',\n",
+ " 'release_2025#feature_Upload a file from an in-memory binary stream#chunk_num30',\n",
+ " 'release_2025#feature_Released Pinecone Terraform Provider v1.0.0#chunk_num31',\n",
+ " 'release_2025#feature_Released .NET SDK v3.1.0#chunk_num32',\n",
+ " 'release_2025#feature_LLM shortcuts for Pinecone docs#chunk_num33',\n",
+ " 'release_2025#feature_na#chunk_num34',\n",
+ " 'release_2025#feature_Control the context snippets the assistant sends to the LLM#chunk_num35',\n",
+ " 'release_2025#feature_Released Go SDK v3.1.0#chunk_num36',\n",
+ " 'release_2025#feature_Launch week: Dark mode#chunk_num37',\n",
+ " 'release_2025#feature_Launch week: Self-service audit logs#chunk_num38',\n",
+ " 'release_2025#feature_Launch week: Introducing the Admin API and service accounts#chunk_num39',\n",
+ " 'release_2025#feature_Launch week: Back up an index through the API#chunk_num40',\n",
+ " 'release_2025#feature_Launch week: Optimized database architecture#chunk_num41',\n",
+ " 'release_2025#feature_Firebase Genkit integration#chunk_num42',\n",
+ " 'release_2025#feature_Bring Your Own Cloud (BYOC) in public preview#chunk_num43',\n",
+ " 'release_2025#feature_na#chunk_num44',\n",
+ " 'release_2025#feature_Docs site refresh#chunk_num45',\n",
+ " 'release_2025#feature_Limit the number of chunks retrieved#chunk_num46',\n",
+ " 'release_2025#feature_Assistant Quickstart colab notebook#chunk_num47',\n",
+ " 'release_2025#feature_Released Node.js SDK v5.0.0#chunk_num48',\n",
+ " 'release_2025#feature_New integrations#chunk_num49',\n",
+ " 'release_2025#feature_Citation highlights in assistant responses#chunk_num50',\n",
+ " 'release_2025#feature_Pinecone API version `2025-01` is now the latest stable version#chunk_num51',\n",
+ " 'release_2025#feature_Released Python SDK v6.0.0#chunk_num52',\n",
+ " 'release_2025#feature_Released Java SDK v4.0.0#chunk_num53',\n",
+ " 'release_2025#feature_Released Go SDK v3.0.0#chunk_num54',\n",
+ " 'release_2025#feature_Released .NET SDK v3.0.0#chunk_num55',\n",
+ " 'release_2025#feature_na#chunk_num56',\n",
+ " 'release_2025#feature_Update to the API keys page#chunk_num57',\n",
+ " 'release_2025#feature_Sparse-only indexes in early access#chunk_num58',\n",
+ " 'release_2025#feature_Released Node SDK v4.1.0#chunk_num59',\n",
+ " 'release_2025#feature_New Billing Admin user role#chunk_num60',\n",
+ " 'release_2025#feature_Released Go SDK v2.2.0#chunk_num61']"
]
},
- "execution_count": 19,
+ "execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
@@ -976,7 +1049,7 @@
"ids = [generate_ids(doc) for doc in pinecone_docs]\n",
"\n",
"\n",
- "# To learn more, look here: https://docs.pinecone.io/guides/manage-data/manage-document-chunks\n",
+ "# To learn more, look here: https://docs.pinecone.io/guides/index-data/data-modeling\n",
"\n",
"vector_store.add_documents(documents=pinecone_docs, ids=ids)\n"
]
@@ -994,45 +1067,38 @@
},
{
"cell_type": "code",
- "execution_count": 20,
+ "execution_count": 13,
"metadata": {},
"outputs": [],
"source": [
"from langchain.chat_models import init_chat_model\n",
"\n",
- "llm = init_chat_model(\"gpt-4o-mini\", model_provider=\"openai\")"
+ "\n",
+ "# Note: as of August 12, 2025, the knowledge cutoff for GPT-5 is Sept 29, 2024.\n",
+ "# If you don't have access yet, gpt-4o-mini works great!\n",
+ "\n",
+ "llm = init_chat_model(\"gpt-5\", model_provider=\"openai\")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "Next, let's run a query and retrieve the most relevant documents from Pinecone. These documents are the context we will ultimately pass to our LLM so it can answer the query."
]
},
{
"cell_type": "code",
- "execution_count": 27,
+ "execution_count": 20,
"metadata": {},
"outputs": [],
"source": [
- "#OpenAI models will be unable to answer this due to training cutoffs in 2023-2024\n",
+ "# Without retrieved context, OpenAI models cannot answer this: their training cutoffs (2023-2024) predate the v7.0 release\n",
"\n",
"query = \"Tell me about version 7.0 of the Pinecone Python SDK\"\n",
"\n",
"retrieved_docs = vector_store.similarity_search(query, k=5)\n",
- "docs_content = \"\\n\\n\".join(doc.page_content for doc in retrieved_docs)\n",
- "\n",
- "prompt = f'''You are an assistant that answers questions exclusively about the \n",
- "Pinecone SDK release notes:\n",
- "\n",
- "Here's a question: {query}\n",
- "\n",
- "Here's some context from the release notes:\n",
- "\n",
- "{docs_content}\n",
- "\n",
- "\n",
- "Question: {query}\n",
- "\n",
- "Answer:\n",
- "'''\n",
- "\n",
- "# This will take a few seconds to run, due to the generation of the response from OpenAI\n",
- "answer = llm.invoke(prompt)"
+ "docs_content = \"\\n\\n\".join(doc.page_content for doc in retrieved_docs)"
]
},
{
@@ -1046,7 +1112,7 @@
},
{
"cell_type": "code",
- "execution_count": 30,
+ "execution_count": 21,
"metadata": {},
"outputs": [
{
@@ -1058,14 +1124,17 @@
" \n",
"\n",
"Metadata:\n",
- "{'chunk_num': 4.0, 'feature': 'Released Python SDK v7.0.1 and v7.0.2', 'month_year': 'May 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
+ "{'chunk_num': 18.0, 'feature': 'Released Python SDK v7.0.1 and v7.0.2', 'month_year': 'May 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
"----------------------------------------------------------------------------------------------------\n",
"Doc number: 2\n",
- "Released [`v7.0.1`](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v7.0.1) and [`v7.0.2`](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v7.0.2) of the [Pinecone Python SDK](/reference/python-sdk). These versions fix minor bugs discovered since the release of the `v7.0.0` major version.\n",
+ "Released [`v7.1.0`](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v7.1.0), [`v7.2.0`](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v7.2.0), and [`v7.3.0`](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v7.3.0) of the [Pinecone Python SDK](/reference/python-sdk). \n",
+ "* `v7.1.0` fixes minor bugs.\n",
+ "* `v7.2.0` adds support for [managing namespaces](/guides/manage-data/manage-namespaces).\n",
+ "* `v7.3.0` adds support for admin API operations for working with API keys, projects, and service accounts.\n",
" \n",
- "\n",
+ "\n",
"Metadata:\n",
- "{'chunk_num': 4.0, 'feature': 'Released Python SDK v7.0.1 and v7.0.2', 'month_year': 'May 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
+ "{'chunk_num': 11.0, 'feature': 'Released Python SDK v7.1.0, v7.2.0, and v7.3.0', 'month_year': 'June 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
"----------------------------------------------------------------------------------------------------\n",
"Doc number: 3\n",
"Released [`v7.0.0`](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v7.0.0) of the [Pinecone Python SDK](/reference/python-sdk). This version uses the latest stable API version, `2025-04`, and includes support for the following: \n",
@@ -1078,22 +1147,9 @@
" \n",
"\n",
"Metadata:\n",
- "{'chunk_num': 7.0, 'feature': 'Released Python SDK v7.0.0', 'month_year': 'May 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
+ "{'chunk_num': 21.0, 'feature': 'Released Python SDK v7.0.0', 'month_year': 'May 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
"----------------------------------------------------------------------------------------------------\n",
"Doc number: 4\n",
- "Released [`v7.0.0`](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v7.0.0) of the [Pinecone Python SDK](/reference/python-sdk). This version uses the latest stable API version, `2025-04`, and includes support for the following: \n",
- "* [Creating and managing backups](/guides/manage-data/back-up-an-index)\n",
- "* [Restoring indexes from backups](/guides/manage-data/restore-an-index)\n",
- "* [Listing embedding and reranking models hosted by Pinecone](/reference/api/2025-04/inference/list_models)\n",
- "* [Getting details about a model hosted by Pinecone](/reference/api/2025-04/inference/describe_model)\n",
- "* [Creating a BYOC index](/guides/production/bring-your-own-cloud#create-an-index) \n",
- "Additionally, the `pinecone-plugin-assistant` package required to work with [Pinecone Assistant](/guides/assistant/overview) is now included by default; it is no longer necessary to install the plugin separately.\n",
- " \n",
- "\n",
- "Metadata:\n",
- "{'chunk_num': 7.0, 'feature': 'Released Python SDK v7.0.0', 'month_year': 'May 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
- "----------------------------------------------------------------------------------------------------\n",
- "Doc number: 5\n",
"Released [`v6.0.0`](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v6.0.0) of the [Pinecone Python SDK](/reference/python-sdk). This version uses the latest stable API version, `2025-01`, and includes support for the following: \n",
"* [Index tags](/guides/manage-data/manage-indexes#configure-index-tags) to categorize and identify your indexes.\n",
"* [Integrated inference](/reference/api/introduction#inference) without the need for extra plugins. If you were using the preview functionality of integrated inference, you must uninstall the `pinecone-plugin-records` package to use the `v6.0.0` release.\n",
@@ -1109,7 +1165,19 @@
" \n",
"\n",
"Metadata:\n",
- "{'chunk_num': 38.0, 'feature': 'Released Python SDK v6.0.0', 'month_year': 'February 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
+ "{'chunk_num': 52.0, 'feature': 'Released Python SDK v6.0.0', 'month_year': 'February 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
+ "----------------------------------------------------------------------------------------------------\n",
+ "Doc number: 5\n",
+ "Released [`v6.0.0`](https://github.com/pinecone-io/pinecone-ts-client/releases/tag/v6.0.0) of the [Pinecone Node.js SDK](/reference/node-sdk). This version uses the latest stable API version, `2025-04`, and includes support for the following: \n",
+ "* [Managing namespaces](/guides/manage-data/manage-namespaces)\n",
+ "* [Creating and managing backups](/guides/manage-data/back-up-an-index)\n",
+ "* [Restoring indexes from backups](/guides/manage-data/restore-an-index)\n",
+ "* [Listing embedding and reranking models hosted by Pinecone](/reference/api/2025-04/inference/list_models)\n",
+ "* [Getting details about a model hosted by Pinecone](/reference/api/2025-04/inference/describe_model)\n",
+ " \n",
+ "\n",
+ "Metadata:\n",
+ "{'chunk_num': 22.0, 'feature': 'Released Node.js SDK v6.0.0', 'month_year': 'May 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
"----------------------------------------------------------------------------------------------------\n"
]
}
@@ -1120,7 +1188,7 @@
" print(d.page_content)\n",
" print(\"Metadata:\")\n",
" print(d.metadata)\n",
- " print(\"-\"*100)\n"
+ " print(\"-\"*100)"
]
},
{
@@ -1140,21 +1208,55 @@
},
{
"cell_type": "code",
- "execution_count": 23,
+ "execution_count": 22,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
- "As of my last update in October 2023, Pinecone frequently releases updates to enhance its features, performance, and usability. To find the most recent major feature release for the Pinecone Python SDK, I recommend checking the official Pinecone documentation or their GitHub repository. They typically have a changelog that outlines new features, improvements, and bug fixes.\n",
+ "I don’t have release notes for Pinecone’s Python SDK version 7.0 in my training data (my knowledge goes up to Oct 2024), and I don’t want to guess. A couple of quick clarifications and ways to get the exact details:\n",
+ "\n",
+ "Questions\n",
+ "- Do you mean the “pinecone” package or “pinecone-client”? They are different packages, and their version numbers may not match.\n",
+ "- Are you looking for new features, breaking changes, or migration guidance?\n",
+ "\n",
+ "How to find the v7.0 details right now\n",
+ "- PyPI release notes:\n",
+ " - pinecone: https://pypi.org/project/pinecone/\n",
+ " - pinecone-client: https://pypi.org/project/pinecone-client/\n",
+ "- GitHub changelog (pinecone-io org): look for the repository of the package you use (commonly “pinecone-python”) and open CHANGELOG.md or Releases.\n",
+ "- Docs: https://docs.pinecone.io (search “Python SDK” and “migration guide”).\n",
"\n",
- "If you're looking for specific features or improvements released recently, you can always visit the Pinecone website or their community forums for announcements or summaries of the latest updates. If you have any specific functionality in mind that you're interested in, feel free to ask!\n"
+ "Commands to check and upgrade locally\n",
+ "- Check which package/version you have:\n",
+ " - pip show pinecone\n",
+ " - pip show pinecone-client\n",
+ " - python -c \"import pinecone, sys; print('pinecone', getattr(pinecone, '__version__', 'unknown'))\"\n",
+ "- Upgrade:\n",
+ " - pip install -U pinecone\n",
+ " - or pip install -U pinecone-client\n",
+ "\n",
+ "What to look for in a major (7.0) release\n",
+ "- Breaking API changes (method/class renames or moved modules)\n",
+ "- Deprecations/removals (older index types or parameters)\n",
+ "- Auth/init changes (e.g., Pinecone(api_key=...) vs init functions)\n",
+ "- Index create specs and defaults (dimension/metric, serverless vs pod settings)\n",
+ "- Data model tweaks (upsert/query payload/response shapes)\n",
+ "- Retry/timeout behavior and error classes\n",
+ "- New features (batching, streaming, filters, hybrid/search, inference hooks)\n",
+ "\n",
+ "If you can share:\n",
+ "- Which package (“pinecone” or “pinecone-client”)\n",
+ "- The current version you’re on\n",
+ "- A snippet of how you currently initialize, upsert, and query\n",
+ "\n",
+ "…I can map that to 7.0 and give you precise, step-by-step migration guidance.\n"
]
}
],
"source": [
- "print(llm.invoke(\"Tell about the most recent major feature release in the Pinecone Python SDK\").content)"
+ "print(llm.invoke(query).content)"
]
},
{
@@ -1166,37 +1268,196 @@
},
{
"cell_type": "code",
- "execution_count": 24,
+ "execution_count": 23,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Here’s what’s in the Pinecone Python SDK 7.0 line:\n",
+ "\n",
+ "- v7.0.0 (2025-06-16): Moves to API version 2025-04 and adds:\n",
+ " - Creating and managing backups\n",
+ " - Restoring indexes from backups\n",
+ " - Listing and describing Pinecone-hosted embedding and reranking models\n",
+ " - Creating Bring Your Own Cloud (BYOC) indexes\n",
+ " - pinecone-plugin-assistant included by default (no separate install needed)\n",
+ "- v7.0.1 and v7.0.2: Patch releases that fix minor bugs discovered after v7.0.0.\n"
+ ]
+ }
+ ],
+ "source": [
+ "prompt = f'''You are an assistant that answers questions exclusively about the \n",
+ "Pinecone SDK release notes:\n",
+ "\n",
+ "Here's a question: {query}\n",
+ "\n",
+ "Here's some context from the release notes:\n",
+ "\n",
+ "{docs_content}\n",
+ "\n",
+ "Answer:\n",
+ "'''\n",
+ "\n",
+ "# This cell takes a few seconds to run while OpenAI generates the response\n",
+ "answer = llm.invoke(prompt)\n",
+ "\n",
+ "print(answer.content)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "## Wrapping it all in a function"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 33,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def generate_response(query, use_pinecone=False, k=5):\n",
+ "    \"\"\"Answer `query` with the LLM, optionally grounded in Pinecone search results.\n",
+ "\n",
+ "    query: the question; also used as the text for the similarity search.\n",
+ "    use_pinecone: if True, retrieve documents, print them, and add them to the prompt.\n",
+ "    k: number of documents to retrieve (default 5).\n",
+ "    Returns the `.content` of the model's reply.\n",
+ "    \"\"\"\n",
+ "    if not use_pinecone:\n",
+ "        return llm.invoke(query).content  # no context is passed\n",
+ "    retrieved_docs = vector_store.similarity_search(query, k=k)\n",
+ "    docs_content = \"\\n\\n\".join(doc.page_content for doc in retrieved_docs)\n",
+ "    # Indentation inside the literal below is part of the text sent to the model.\n",
+ "    prompt = f'''\n",
+ "        You are an assistant that answers questions exclusively about the \n",
+ "        Pinecone SDK release notes:\n",
+ "\n",
+ "        Here's a question: {query}\n",
+ "\n",
+ "        Here's some context from the release notes:\n",
+ "\n",
+ "        {docs_content}\n",
+ "\n",
+ "        Answer: '''\n",
+ "    print(\"Retrieved documents:.....\")\n",
+ "    for num, d in enumerate(retrieved_docs, start=1):\n",
+ "        print(f\"Doc number: {num}\")\n",
+ "        print(d.page_content)\n",
+ "        print(\"Metadata:\")\n",
+ "        print(d.metadata)\n",
+ "        print(\"-\"*100)\n",
+ "    print(\"Chatbot response:.....\")\n",
+ "    return llm.invoke(prompt).content"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 34,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
- "The Pinecone Python SDK version 7.0 includes a major release (`v7.0.0`) and subsequent minor updates (`v7.0.1` and `v7.0.2`) that address minor bugs.\n",
+ "Short answer: Pinecone’s sparse encoder used to be effectively limited to ~512 tokens (BERT-era limit). Recently, Pinecone raised the usable context window by adding server-side chunk-and-merge, so you can pass much longer inputs and get a single sparse vector back. In practice, this means you no longer need to manually chunk long documents just to get a usable sparse embedding.\n",
"\n",
- "### Version 7.0.0\n",
- "Released on May 19, 2025, this version utilizes the latest stable API version, `2025-04`, and offers several new features:\n",
- "- **Creating and managing backups**: Users can now create and manage backups of their indexes.\n",
- "- **Restoring indexes from backups**: This feature allows users to restore their indexes from previously created backups.\n",
- "- **Listing embedding and reranking models**: Users can list models that are hosted by Pinecone.\n",
- "- **Getting model details**: This feature provides detailed information about a specific model hosted by Pinecone.\n",
- "- **Creating a BYOC (Bring Your Own Cloud) index**: Users are now able to create indexes within their own cloud environments.\n",
+ "What changed\n",
+ "- Longer inputs accepted: You can now send texts far beyond 512 tokens; the service splits them internally and merges the term weights into one sparse vector. This improves recall on long documents and simplifies pipelines.\n",
+ "- Smarter merging: The merger reduces double-counting of repeated terms across chunks and normalizes weights, helping stability vs. naive summation.\n",
+ "- Progressive limits: The maximum accepted input length has been increased from the original 512-token ceiling to a much larger cap (the exact hard limit can change as they roll out updates).\n",
"\n",
- "Additionally, the `pinecone-plugin-assistant` package, which is needed for working with Pinecone Assistant, is now included by default, eliminating the need for a separate installation.\n",
+ "How to confirm the current limit\n",
+ "- Check the pinecone-sparse model card in Pinecone’s docs or the Inference “Models” page.\n",
+ "- Call the models/list or embeddings create endpoint and look for the model’s max input length; if you exceed it, the API error usually reports the current cap.\n",
+ "- Review the Pinecone changelog or release notes for “pinecone-sparse” (they’ve been incrementally expanding the window).\n",
"\n",
- "### Minor Versions: 7.0.1 and 7.0.2\n",
- "Released on May 29, 2025, versions `7.0.1` and `7.0.2` were released to fix minor bugs that had been discovered after the `v7.0.0` major release.\n",
+ "Practical guidance\n",
+ "- You can now pass full sections/long pages directly. If you still prefer control, client-side chunking at 800–1,200 tokens with slight overlap works well; the server-side merge will still help.\n",
+ "- For hybrid search, keep an eye on term-weight saturation with very long inputs; consider light client-side chunking if you need fine-grained retrieval.\n",
"\n",
- "For more details, you can view the release notes for each version: \n",
- "- [v7.0.0](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v7.0.0)\n",
- "- [v7.0.1](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v7.0.1)\n",
- "- [v7.0.2](https://github.com/pinecone-io/pinecone-python-client/releases/tag/v7.0.2)\n"
+ "If you can share the timeframe or a link to the announcement you’re referring to, I can tailor this to the exact version and hard token limit you’re targeting.\n"
]
}
],
"source": [
- "print(answer.content)"
+ "query = \"Tell me about recent changes to the pinecone-sparse embedding model context window\"\n",
+ "\n",
+ "print(generate_response(query, use_pinecone=False))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 35,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Retrieved documents:.....\n",
+ "Doc number: 1\n",
+ "You can now raise the context window for Pinecone's hosted [`pinecone-sparse-english-v0`](/guides/index-data/create-an-index#pinecone-sparse-english-v0) embedding model from `512` to `2048` using the `max_tokens_per_sequence` parameter.\n",
+ " \n",
+ "\n",
+ "Metadata:\n",
+ "{'chunk_num': 5.0, 'feature': 'Increased context window for `pinecone-sparse-english-v0`', 'month_year': 'July 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
+ "----------------------------------------------------------------------------------------------------\n",
+ "Doc number: 2\n",
+ "Pinecone Inference now supports [`pinecone-sparse-english-v0`](/guides/search/rerank-results#pinecone-sparse-english-v0), Pinecone's sparse embedding model, which estimates the lexical importance of tokens by leveraging their context, unlike traditional retrieval models like BM25, which rely solely on term frequency. This model is in [public preview](/release-notes/feature-availability).\n",
+ "\n",
+ "Metadata:\n",
+ "{'chunk_num': 12.0, 'feature': 'Launch week: Released `pinecone-sparse-english-v0`', 'month_year': 'December 2024', 'release': '2024 releases', 'source': 'https://docs.pinecone.io/release-notes/2024.md'}\n",
+ "----------------------------------------------------------------------------------------------------\n",
+ "Doc number: 3\n",
+ "Released [`v3.0.0`](https://github.com/pinecone-io/pinecone-dotnet-client/releases/tag/3.0.0) of the [Pinecone .NET SDK](/reference/dotnet-sdk). This version uses the latest stable API version, `2025-01`, and adds support for [sparse-only indexes](/guides/index-data/indexing-overview#sparse-indexes). \n",
+ "\n",
+ "Before upgrading to `v3.0.0`, update all relevant code to account for the following [breaking changes](/reference/api/versioning#breaking-changes). See the [`v3.0.0`](https://github.com/pinecone-io/pinecone-dotnet-client/releases/tag/3.0.0) release notes for full details. \n",
+ "* [`embed` operation](/reference/api/2025-01/inference/generate-embeddings):\n",
+ "* The `Embedding` type has changed from a simple object to a discriminated union, supporting both `DenseEmbedding` and `SparseEmbedding`. New helper methods available on the Embedding type: `IsDense` and `IsSparse` for type checking, `AsDense()` and `AsSparse()` for type conversion, and `Match()` and `Visit()` for pattern matching.\n",
+ "* The `Parameters` property now uses `Dictionary?` instead of `EmbedRequestParameters`. \n",
+ "* `rerank` operation:\n",
+ "* The `Document` property now uses `Dictionary?` instead of `Dictionary?`.\n",
+ "* The `Parameters` property now uses `Dictionary?` instead of `Dictionary?`.\n",
+ "\n",
+ "\n",
+ "Metadata:\n",
+ "{'chunk_num': 55.0, 'feature': 'Released .NET SDK v3.0.0', 'month_year': 'February 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
+ "----------------------------------------------------------------------------------------------------\n",
+ "Doc number: 4\n",
+ "Released [`v4.0.0`](https://github.com/pinecone-io/pinecone-java-client/releases/tag/v4.0.0) of the [Pinecone Java SDK](/reference/java-sdk). This version uses the latest stable API version, `2025-01`, and adds support for [sparse-only indexes](/guides/index-data/indexing-overview#sparse-indexes). \n",
+ "\n",
+ "Before upgrading to `v4.0.0`, update all relevant code to account for the following [breaking changes](/reference/api/versioning#breaking-changes). See the [`v4.0.0`](https://github.com/pinecone-io/pinecone-java-client/releases/tag/v4.0.0) release notes for full details. \n",
+ "* [`embed` method](/reference/api/2025-01/inference/generate-embeddings):\n",
+ "* `parameters` now accepts `Map` instead of `EmbedRequestParameters`.\n",
+ "* The `Embeddings` response class now has dense and sparse embeddings. You now must use `getDenseEmbedding()` or `getSparseEmbedding()`. For example, instead of `embeddings.getData().get(0).getValues()`, you would use `embeddings.getData().get(0).getDenseEmbedding().getValues()`. \n",
+ "* [`rerank` method](/guides/search/rerank-results):\n",
+ "* `documents` now accepts `List\n",
+ " \n",
+ "\n",
+ "Metadata:\n",
+ "{'chunk_num': 53.0, 'feature': 'Released Java SDK v4.0.0', 'month_year': 'February 2025', 'release': '2025 releases', 'source': 'https://docs.pinecone.io/release-notes/2025.md'}\n",
+ "----------------------------------------------------------------------------------------------------\n",
+ "Doc number: 5\n",
+ "You can now use [embedding models](/guides/index-data/create-an-index#embedding-models) and [reranking models](/guides/search/rerank-results#reranking-models) hosted on Pinecone as an integrated part of upserting and searching.\n",
+ " \n",
+ "\n",
+ "Metadata:\n",
+ "{'chunk_num': 9.0, 'feature': 'Launch week: Integrated Inference', 'month_year': 'December 2024', 'release': '2024 releases', 'source': 'https://docs.pinecone.io/release-notes/2024.md'}\n",
+ "----------------------------------------------------------------------------------------------------\n",
+ "Chatbot response:.....\n",
+ "- You can now raise the context window for Pinecone’s hosted pinecone-sparse-english-v0 embedding model from 512 to 2048 tokens.\n",
+ "- Set the max_tokens_per_sequence parameter to increase the limit.\n"
+ ]
+ }
+ ],
+ "source": [
+ "print(generate_response(query, use_pinecone=True))"
]
},
{
@@ -1216,7 +1477,7 @@
},
{
"cell_type": "code",
- "execution_count": 226,
+ "execution_count": 36,
"metadata": {
"id": "PpJp-xExFeLa"
},
@@ -1240,7 +1501,7 @@
"provenance": []
},
"kernelspec": {
- "display_name": "Python 3 (ipykernel)",
+ "display_name": "pinecone-examples",
"language": "python",
"name": "python3"
},
@@ -1255,11 +1516,6 @@
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.11.9"
- },
- "vscode": {
- "interpreter": {
- "hash": "57376684f67c5d7b1589c855d7d0f1a1bdf8944ab1b903e711fdbf39434567bb"
- }
}
},
"nbformat": 4,