weaviate
diff --git a/.github/dependabot.yml
Lines changed: 1 addition & 1 deletion b/.github/dependabot.yml
Lines changed: 1 addition & 1 deletion
diff --git a/ci/docker-compose-wcs.yml
Lines changed: 3 additions & 3 deletions b/ci/docker-compose-wcs.yml
Lines changed: 3 additions & 3 deletions
diff --git a/docs/changelog.rst
Lines changed: 14 additions & 1 deletion b/docs/changelog.rst
Lines changed: 14 additions & 1 deletion
diff --git a/integration/test_backup_v4.py
Lines changed: 0 additions & 1 deletion b/integration/test_backup_v4.py
Lines changed: 0 additions & 1 deletion
diff --git a/integration/test_client.py
Lines changed: 1 addition & 1 deletion b/integration/test_client.py
Lines changed: 1 addition & 1 deletion
diff --git a/integration/test_collection_config.py
Lines changed: 4 additions & 2 deletions b/integration/test_collection_config.py
Lines changed: 4 additions & 2 deletions
diff --git a/integration/test_collection_filter.py
Lines changed: 8 additions & 1 deletion b/integration/test_collection_filter.py
Lines changed: 8 additions & 1 deletion
diff --git a/integration/test_collection_openai.py
Lines changed: 167 additions & 0 deletions b/integration/test_collection_openai.py
Lines changed: 167 additions & 0 deletions
diff --git a/integration/test_collection_rerank.py
Lines changed: 58 additions & 0 deletions b/integration/test_collection_rerank.py
Lines changed: 58 additions & 0 deletions
diff --git a/requirements-devel.txt
Lines changed: 2 additions & 2 deletions b/requirements-devel.txt
Lines changed: 2 additions & 2 deletions
@@ -8,7 +8,7 @@ updates:
   - package-ecosystem: "pip" # See documentation for possible values
     directory: "/" # Location of package manifests
     schedule:
-      interval: "weekly"
+      interval: "monthly"
     ignore:
       - dependency-name: "grpcio"
       - dependency-name: "grpcio-tools"
 
@@ -19,10 +19,10 @@ services:
       PERSISTENCE_DATA_PATH: '/var/lib/weaviate'
       AUTHENTICATION_ANONYMOUS_ACCESS_ENABLED: 'false'
       AUTHENTICATION_OIDC_ENABLED: 'true'
-      AUTHENTICATION_OIDC_CLIENT_ID: 'wcs'
-      AUTHENTICATION_OIDC_ISSUER: 'https://auth.wcs.api.weaviate.io/auth/realms/SeMI'
+      AUTHENTICATION_OIDC_CLIENT_ID: 'Peuc12y02UA0eAED1dqSjE5HtGUrpBsx'
+      AUTHENTICATION_OIDC_ISSUER: 'https://auth.weaviate.cloud/Peuc12y02UA0eAED1dqSjE5HtGUrpBsx'
       AUTHENTICATION_OIDC_USERNAME_CLAIM: 'email'
-      AUTHENTICATION_OIDC_GROUPS_CLAIM: 'groups'
+      AUTHENTICATION_OIDC_GROUPS_CLAIM: 'roles'
       AUTHORIZATION_ADMINLIST_ENABLED: 'true'
       AUTHORIZATION_ADMINLIST_USERS: '[email protected]'
       AUTHENTICATION_OIDC_SCOPES: 'openid,email'
 
@@ -1,11 +1,24 @@
 Changelog
 =========
 
+Version 4.18.3
+--------------
+This patch version includes:
+    - Fixes an incorrect deprecation warning shown in PyCharm when creating a collection without vectorizers
+    - Fixes warnings with boolean filters
+
+Version 4.18.2
+--------------
+This patch version includes:
+    - Add support for Contextual AI generative and reranker modules
+    - Add support for ZSTD compression in backups
+    - Add support for VoyageAI's voyage-3-large model
+
 Version 4.18.1
 --------------
 This patch version includes:
     - Add 'dimensions' param to cohere vectorizers  (feat/cohere-dimensions-param)
-    - Add dimensions parameter to text2vec-voyageai methods (feat/t2v-voyage-add-dimensions)
+    - Add 'dimensions' parameter to text2vec-voyageai methods (feat/t2v-voyage-add-dimensions)
 
 Version 4.18.0
 --------------
 
@@ -464,7 +464,6 @@ def test_backup_and_restore_with_collection_and_config_1_24_x(
         wait_for_completion=True,
         config=BackupConfigCreate(
             cpu_percentage=60,
-            chunk_size=256,
             compression_level=BackupCompressionLevel.BEST_SPEED,
         ),
     )
 
@@ -271,7 +271,7 @@ def test_create_export_and_recreate(client: weaviate.WeaviateClient, request: Su
     assert export.generative_config is not None
     assert export.generative_config.generative == GenerativeSearches.COHERE
     assert export.generative_config.model["model"] == "command-r-plus"
-    assert export.generative_config.model["kProperty"] == 10
+    assert export.generative_config.model["k"] == 10
 
     client.collections.delete([name1, name2])
     assert not client.collections.exists(name1)
 
@@ -913,9 +913,11 @@ def test_config_vector_index_hnsw_and_quantizer_pq(collection_factory: Collectio
     [
         (Configure.Reranker.cohere(), Rerankers.COHERE, {}),
         (
-            Configure.Reranker.cohere(model="rerank-english-v2.0"),
+            Configure.Reranker.cohere(
+                model="rerank-english-v2.0", base_url="https://some-cohere-baseurl.ai/"
+            ),
             Rerankers.COHERE,
-            {"model": "rerank-english-v2.0"},
+            {"model": "rerank-english-v2.0", "baseURL": "https://some-cohere-baseurl.ai/"},
         ),
         (Configure.Reranker.transformers(), Rerankers.TRANSFORMERS, {}),
     ],
 
@@ -278,13 +278,14 @@ def test_filters_comparison(
     ],
 )
 def test_filters_contains(
+    recwarn: pytest.WarningsRecorder,
     collection_factory: CollectionFactory,
     weaviate_filter: _FilterValue,
     results: List[int],
     require_version: Optional[tuple[int, int, int]],
 ) -> None:
     collection = collection_factory(
-        vectorizer_config=Configure.Vectorizer.none(),
+        vector_config=Configure.Vectors.self_provided(),
         properties=[
             Property(name="text", data_type=DataType.TEXT),
             Property(name="texts", data_type=DataType.TEXT_ARRAY),
@@ -380,6 +381,12 @@ def test_filters_contains(
     uuids = [uuids[result] for result in results]
     assert all(obj.uuid in uuids for obj in objects)
 
+    # Check for warnings to make sure booleans are handled as their correct type and are not sent as ints
+    if len(recwarn) != 0:
+        for rwarning in recwarn.list:
+            print(rwarning.message)
+    assert len(recwarn) == 0
+
 
 @pytest.mark.parametrize(
     "weaviate_filter,results",
 
@@ -740,3 +740,170 @@ def test_near_text_generate_with_dynamic_rag(
             assert g0.debug is None
             assert g0.metadata is None
             assert g1.metadata is None
+
+
+@pytest.mark.parametrize("parameter,answer", [("text", "yes"), ("content", "no")])
+def test_contextualai_generative_search_single(
+    collection_factory: CollectionFactory, parameter: str, answer: str
+) -> None:
+    """Test that a Contextual AI single prompt answers from the interpolated property."""
+    api_key = os.environ.get("CONTEXTUAL_API_KEY")
+    if api_key is None:
+        pytest.skip("No Contextual AI API key found.")
+
+    collection = collection_factory(
+        name="TestContextualAIGenerativeSingle",
+        generative_config=Configure.Generative.contextualai(
+            model="v2",
+            max_new_tokens=100,
+            temperature=0.1,
+            system_prompt="You are a helpful assistant that provides accurate and informative responses based on the given context. Answer with yes or no only.",
+            avoid_commentary=False,
+        ),
+        vector_config=Configure.Vectors.self_provided(),  # replaces deprecated vectorizer_config
+        properties=[
+            Property(name="text", data_type=DataType.TEXT),
+            Property(name="content", data_type=DataType.TEXT),
+        ],
+        headers={"X-Contextual-Api-Key": api_key},
+        ports=(8086, 50057),
+    )
+    if collection._connection._weaviate_version.is_lower_than(1, 23, 1):
+        pytest.skip("Generative search requires Weaviate 1.23.1 or higher")
+
+    collection.data.insert_many(
+        [
+            DataObject(properties={"text": "bananas are great", "content": "bananas are bad"}),
+            DataObject(properties={"text": "apples are great", "content": "apples are bad"}),
+        ]
+    )
+
+    prompt = f"is it good or bad based on {{{parameter}}}? Just answer with yes or no without punctuation"
+    res = collection.generate.fetch_objects(single_prompt=prompt)
+    assert res.objects, "no objects returned, so the per-object checks would pass vacuously"
+    for obj in res.objects:
+        assert obj.generated is not None
+        assert obj.generated.strip().lower() == answer  # tolerate surrounding whitespace
+    assert res.generated is None
+
+
+def test_contextualai_generative_with_knowledge_parameter(
+    collection_factory: CollectionFactory,
+) -> None:
+    """Test that a query-time ``knowledge`` override is accepted by Contextual AI generation."""
+    api_key = os.environ.get("CONTEXTUAL_API_KEY")
+    if api_key is None:
+        pytest.skip("No Contextual AI API key found.")
+
+    collection = collection_factory(
+        name="TestContextualAIGenerativeKnowledge",
+        generative_config=Configure.Generative.contextualai(
+            model="v2",
+            max_new_tokens=100,
+            temperature=0.1,
+            system_prompt="You are a helpful assistant.",
+            avoid_commentary=False,
+        ),
+        vector_config=Configure.Vectors.self_provided(),  # replaces deprecated vectorizer_config
+        properties=[Property(name="text", data_type=DataType.TEXT)],
+        headers={"X-Contextual-Api-Key": api_key},
+        ports=(8086, 50057),
+    )
+    if collection._connection._weaviate_version.is_lower_than(1, 23, 1):
+        pytest.skip("Generative search requires Weaviate 1.23.1 or higher")
+
+    collection.data.insert_many(
+        [
+            DataObject(properties={"text": "base knowledge"}),
+        ]
+    )
+
+    # Pass ``knowledge`` at query time through the per-request generative config.
+    res = collection.generate.fetch_objects(
+        single_prompt="What is the custom knowledge?",
+        config=GenerativeConfig.contextualai(
+            knowledge=["Custom knowledge override", "Additional context"],
+        ),
+    )
+    # Guard against a vacuous pass: the loop below asserts nothing if no objects come back.
+    assert res.objects, "expected the inserted object to be returned"
+    for obj in res.objects:
+        assert obj.generated is not None
+        assert isinstance(obj.generated, str)
+
+
+def test_contextualai_generative_and_rerank_combined(collection_factory: CollectionFactory) -> None:
+    """Test that Contextual AI generation and reranking work together on every search type."""
+    contextual_api_key = os.environ.get("CONTEXTUAL_API_KEY")
+    if contextual_api_key is None:
+        pytest.skip("No Contextual AI API key found.")
+
+    collection = collection_factory(
+        name="TestContextualAIGenerativeAndRerank",
+        generative_config=Configure.Generative.contextualai(
+            model="v2",
+            max_new_tokens=100,
+            temperature=0.1,
+            system_prompt="You are a helpful assistant that provides accurate and informative responses based on the given context.",
+            avoid_commentary=False,
+        ),
+        reranker_config=Configure.Reranker.contextualai(
+            model="ctxl-rerank-v2-instruct-multilingual",
+            instruction="Prioritize documents that contain the query term",
+        ),
+        # NOTE(review): text2vec_openai presumably needs an OpenAI key, but only the Contextual
+        # AI header is sent here - confirm the test instance has one configured server-side.
+        vectorizer_config=Configure.Vectorizer.text2vec_openai(),
+        properties=[Property(name="text", data_type=DataType.TEXT)],
+        headers={"X-Contextual-Api-Key": contextual_api_key},
+        ports=(8086, 50057),
+    )
+    if collection._connection._weaviate_version.is_lower_than(1, 23, 1):
+        pytest.skip("Generative reranking requires Weaviate 1.23.1 or higher")
+
+    insert = collection.data.insert_many(
+        [{"text": "This is a test"}, {"text": "This is another test"}]
+    )
+    uuid1 = insert.uuids[0]
+    vector1 = collection.query.fetch_object_by_id(uuid1, include_vector=True).vector
+    assert vector1 is not None
+
+    # Each of the five searches is run with the same rerank and single-prompt arguments.
+    queries = [
+        lambda: collection.generate.bm25(
+            "test",
+            rerank=Rerank(prop="text", query="another"),
+            single_prompt="What is it? {text}",
+        ),
+        lambda: collection.generate.hybrid(
+            "test",
+            rerank=Rerank(prop="text", query="another"),
+            single_prompt="What is it? {text}",
+        ),
+        lambda: collection.generate.near_object(
+            uuid1,
+            rerank=Rerank(prop="text", query="another"),
+            single_prompt="What is it? {text}",
+        ),
+        lambda: collection.generate.near_vector(
+            vector1["default"],
+            rerank=Rerank(prop="text", query="another"),
+            single_prompt="What is it? {text}",
+        ),
+        lambda: collection.generate.near_text(
+            "test",
+            rerank=Rerank(prop="text", query="another"),
+            single_prompt="What is it? {text}",
+        ),
+    ]
+    for query in queries:
+        objects = query().objects
+        assert len(objects) == 2
+        assert objects[0].metadata.rerank_score is not None
+        assert objects[0].generated is not None
+        assert objects[1].metadata.rerank_score is not None
+        assert objects[1].generated is not None
+
+        hits = [obj for obj in objects if "another" in obj.properties["text"]]  # type: ignore
+        rest = [obj for obj in objects if "another" not in obj.properties["text"]]  # type: ignore
+        assert hits[0].metadata.rerank_score > rest[0].metadata.rerank_score  # type: ignore
@@ -138,3 +138,61 @@ def test_queries_with_rerank_and_group_by(collection_factory: CollectionFactory)
         ].rerank_score > [group for prop, group in ret.groups.items() if "another" not in prop][
             0
         ].rerank_score
+
+
+def test_queries_with_rerank_contextualai(collection_factory: CollectionFactory) -> None:
+    """Test that the Contextual AI reranker scores results for every search type."""
+    api_key = os.environ.get("CONTEXTUAL_API_KEY")
+    if api_key is None:
+        pytest.skip("No Contextual AI API key found.")
+
+    collection = collection_factory(
+        name="Test_test_queries_with_rerank_contextualai",
+        reranker_config=wvc.config.Configure.Reranker.contextualai(
+            model="ctxl-rerank-v2-instruct-multilingual",
+            instruction="Prioritize documents that contain the query term",
+        ),
+        # NOTE(review): text2vec_openai presumably needs an OpenAI key, but only the Contextual
+        # AI header is sent here - confirm the test instance has one configured server-side.
+        vectorizer_config=wvc.config.Configure.Vectorizer.text2vec_openai(),
+        properties=[wvc.config.Property(name="text", data_type=wvc.config.DataType.TEXT)],
+        headers={"X-Contextual-Api-Key": api_key},
+        ports=(8086, 50057),
+    )
+    if collection._connection._weaviate_version.is_lower_than(1, 23, 1):
+        pytest.skip("Reranking requires Weaviate 1.23.1 or higher")
+
+    insert = collection.data.insert_many(
+        [{"text": "This is a test"}, {"text": "This is another test"}]
+    )
+    uuid1 = insert.uuids[0]
+    vector1 = collection.query.fetch_object_by_id(uuid1, include_vector=True).vector
+    assert vector1 is not None
+
+    # Each of the five searches is run with the same rerank argument.
+    queries = [
+        lambda: collection.query.bm25(
+            "test", rerank=wvc.query.Rerank(prop="text", query="another")
+        ),
+        lambda: collection.query.hybrid(
+            "test", rerank=wvc.query.Rerank(prop="text", query="another")
+        ),
+        lambda: collection.query.near_object(
+            uuid1, rerank=wvc.query.Rerank(prop="text", query="another")
+        ),
+        lambda: collection.query.near_vector(
+            vector1["default"], rerank=wvc.query.Rerank(prop="text", query="another")
+        ),
+        lambda: collection.query.near_text(
+            "test", rerank=wvc.query.Rerank(prop="text", query="another")
+        ),
+    ]
+    for query in queries:
+        objects = query().objects
+        assert len(objects) == 2
+        assert objects[0].metadata.rerank_score is not None
+        assert objects[1].metadata.rerank_score is not None
+
+        hits = [obj for obj in objects if "another" in obj.properties["text"]]  # type: ignore
+        rest = [obj for obj in objects if "another" not in obj.properties["text"]]  # type: ignore
+        assert hits[0].metadata.rerank_score > rest[0].metadata.rerank_score  # type: ignore
@@ -17,7 +17,7 @@ sphinx-rtd-theme==3.0.2
 autodoc-pydantic==2.2.0
 importlib_metadata==8.7.0
 
-tomli==2.2.1
+tomli==2.3.0
 types-protobuf==6.30.2.20250703
 types-urllib3==1.26.25.14
 typing_extensions==4.14.1
@@ -29,4 +29,4 @@ flake8-comprehensions==3.17.0
 flake8-builtins==3.0.0
 flake8-docstrings==1.7.0
 pydoclint==0.7.3
-ruff==0.12.8
+ruff==0.14.7
Original file line number	Diff line number	Diff line change
`@@ -464,7 +464,6 @@ def test_backup_and_restore_with_collection_and_config_1_24_x(`
`464`	`464`	`wait_for_completion=True,`
`465`	`465`	`config=BackupConfigCreate(`
`466`	`466`	`cpu_percentage=60,`
`467`		`- chunk_size=256,`
`468`	`467`	`compression_level=BackupCompressionLevel.BEST_SPEED,`
`469`	`468`	`),`
`470`	`469`	`)`
Original file line number	Diff line number	Diff line change
`@@ -913,9 +913,11 @@ def test_config_vector_index_hnsw_and_quantizer_pq(collection_factory: Collectio`
`913`	`913`	`[`
`914`	`914`	`(Configure.Reranker.cohere(), Rerankers.COHERE, {}),`
`915`	`915`	`(`
`916`		`- Configure.Reranker.cohere(model="rerank-english-v2.0"),`
	`916`	`+ Configure.Reranker.cohere(`
	`917`	`+ model="rerank-english-v2.0", base_url="https://some-cohere-baseurl.ai/"`
	`918`	`+ ),`
`917`	`919`	`Rerankers.COHERE,`
`918`		`- {"model": "rerank-english-v2.0"},`
	`920`	`+ {"model": "rerank-english-v2.0", "baseURL": "https://some-cohere-baseurl.ai/"},`
`919`	`921`	`),`
`920`	`922`	`(Configure.Reranker.transformers(), Rerankers.TRANSFORMERS, {}),`
`921`	`923`	`],`