Skip to content

Commit a8e80cc

Browse files
committed
use more realistic vector values
1 parent c9319c9 commit a8e80cc

File tree

2 files changed

+23
-22
lines changed

2 files changed

+23
-22
lines changed

datastore/cloud-client/vector_search.py

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -24,7 +24,7 @@ def store_vectors():
2424
{
2525
"name": "Kahawa coffee beans",
2626
"description": "Information about the Kahawa coffee beans.",
27-
"embedding_field": Vector([1.0, 2.0, 3.0]),
27+
"embedding_field": Vector([0.18332680, 0.24160706, 0.3416704]),
2828
}
2929
)
3030

@@ -43,7 +43,7 @@ def vector_search_basic(db):
4343
kind="coffee-beans",
4444
find_nearest=FindNearest(
4545
vector_property="embedding_field",
46-
query_vector=Vector([3.0, 1.0, 2.0]),
46+
query_vector=Vector([0.3416704, 0.18332680, 0.24160706]),
4747
distance_measure=DistanceMeasure.EUCLIDEAN,
4848
limit=5,
4949
)
@@ -64,7 +64,7 @@ def vector_search_prefilter(db):
6464
filters=[PropertyFilter("color", "=", "red")],
6565
find_nearest=FindNearest(
6666
vector_property="embedding_field",
67-
query_vector=Vector([3.0, 1.0, 2.0]),
67+
query_vector=Vector([0.3416704, 0.18332680, 0.24160706]),
6868
distance_measure=DistanceMeasure.EUCLIDEAN,
6969
limit=5,
7070
)
@@ -83,7 +83,7 @@ def vector_search_distance_result_property(db):
8383
kind="coffee-beans",
8484
find_nearest=FindNearest(
8585
vector_property="embedding_field",
86-
query_vector=Vector([3.0, 1.0, 2.0]),
86+
query_vector=Vector([0.3416704, 0.18332680, 0.24160706]),
8787
distance_measure=DistanceMeasure.EUCLIDEAN,
8888
limit=5,
8989
distance_result_property="vector_distance",
@@ -105,7 +105,7 @@ def vector_search_distance_result_property_projection(db):
105105
kind="coffee-beans",
106106
find_nearest=FindNearest(
107107
vector_property="embedding_field",
108-
query_vector=Vector([3.0, 1.0, 2.0]),
108+
query_vector=Vector([0.3416704, 0.18332680, 0.24160706]),
109109
distance_measure=DistanceMeasure.EUCLIDEAN,
110110
limit=5,
111111
distance_result_property="vector_distance",
@@ -129,10 +129,10 @@ def vector_search_distance_threshold(db):
129129
kind="coffee-beans",
130130
find_nearest=FindNearest(
131131
vector_property="embedding_field",
132-
query_vector=Vector([3.0, 1.0, 2.0]),
132+
query_vector=Vector([0.3416704, 0.18332680, 0.24160706]),
133133
distance_measure=DistanceMeasure.EUCLIDEAN,
134134
limit=10,
135-
distance_threshold=4.5
135+
distance_threshold=0.4
136136
)
137137
)
138138

@@ -153,7 +153,7 @@ def vector_search_large_response(db):
153153
kind="coffee-beans",
154154
find_nearest=FindNearest(
155155
vector_property="embedding_field",
156-
query_vector=Vector([3.0, 1.0, 2.0]),
156+
query_vector=Vector([0.3416704, 0.18332680, 0.24160706]),
157157
distance_measure=DistanceMeasure.EUCLIDEAN,
158158
limit=100,
159159
distance_result_property="vector_distance",

datastore/cloud-client/vector_search_test.py

Lines changed: 15 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -21,6 +21,7 @@
2121
from vector_search import store_vectors
2222
from vector_search import vector_search_basic
2323
from vector_search import vector_search_distance_result_property
24+
from vector_search import vector_search_distance_result_property_projection
2425
from vector_search import vector_search_distance_threshold
2526
from vector_search import vector_search_prefilter
2627
from vector_search import vector_search_large_response
@@ -49,13 +50,13 @@ def _clear_db(db):
4950

5051
def add_coffee_beans_data(db):
5152
entity1 = datastore.Entity(db.key("coffee-beans", "Arabica"))
52-
entity1.update({"embedding_field": Vector([10.0, 1.0, 2.0]), "color": "red"})
53+
entity1.update({"embedding_field": Vector([0.80522226, 0.18332680, 0.24160706]), "color": "red"})
5354
entity2 = datastore.Entity(db.key("coffee-beans", "Robusta"))
54-
entity2.update({"embedding_field": Vector([4.0, 1.0, 2.0]), "color": ""})
55+
entity2.update({"embedding_field": Vector([0.43979567, 0.18332680, 0.24160706]), "color": ""})
5556
entity3 = datastore.Entity(db.key("coffee-beans", "Excelsa"))
56-
entity3.update({"embedding_field": Vector([11.0, 1.0, 2.0]), "color": "red"})
57+
entity3.update({"embedding_field": Vector([0.90477061, 0.18332680, 0.24160706]), "color": "red"})
5758
entity4 = datastore.Entity(db.key("coffee-beans", "Liberica"))
58-
entity4.update({"embedding_field": Vector([3.0, 1.0, 2.0]), "color": "green"})
59+
entity4.update({"embedding_field": Vector([0.3416704, 0.18332680, 0.24160706]), "color": "green"})
5960

6061
entity_list = [entity1, entity2, entity3, entity4]
6162
db.put_multi(entity_list)
@@ -93,16 +94,16 @@ def test_vector_search_distance_result_property(db):
9394
assert len(results) == 4
9495
assert results[0].key.name == "Liberica"
9596
assert results[0]["vector_distance"] == 0.0
96-
assert results[0]["embedding_field"] == Vector([3.0, 1.0, 2.0])
97+
assert results[0]["embedding_field"] == Vector([0.3416704, 0.18332680, 0.24160706])
9798
assert results[1].key.name == "Robusta"
98-
assert results[1]["vector_distance"] == 1.0
99-
assert results[1]["embedding_field"] == Vector([4.0, 1.0, 2.0])
99+
assert results[1]["vector_distance"] == pytest.approx(0.09812527)
100+
assert results[1]["embedding_field"] == Vector([0.43979567, 0.18332680, 0.24160706])
100101
assert results[2].key.name == "Arabica"
101-
assert results[2]["vector_distance"] == 7.0
102-
assert results[2]["embedding_field"] == Vector([10.0, 1.0, 2.0])
102+
assert results[2]["vector_distance"] == pytest.approx(0.46355186)
103+
assert results[2]["embedding_field"] == Vector([0.80522226, 0.18332680, 0.24160706])
103104
assert results[3].key.name == "Excelsa"
104-
assert results[3]["vector_distance"] == 8.0
105-
assert results[3]["embedding_field"] == Vector([11.0, 1.0, 2.0])
105+
assert results[3]["vector_distance"] == pytest.approx(0.56310021)
106+
assert results[3]["embedding_field"] == Vector([0.90477061, 0.18332680, 0.24160706])
106107

107108

108109
def test_vector_search_distance_result_property_projection(db):
@@ -113,11 +114,11 @@ def test_vector_search_distance_result_property_projection(db):
113114
assert results[0].key.name == "Liberica"
114115
assert results[0]["vector_distance"] == 0.0
115116
assert results[1].key.name == "Robusta"
116-
assert results[1]["vector_distance"] == 1.0
117+
assert results[1]["vector_distance"] == pytest.approx(0.09812527)
117118
assert results[2].key.name == "Arabica"
118-
assert results[2]["vector_distance"] == 7.0
119+
assert results[2]["vector_distance"] == pytest.approx(0.46355186)
119120
assert results[3].key.name == "Excelsa"
120-
assert results[3]["vector_distance"] == 8.0
121+
assert results[3]["vector_distance"] == pytest.approx(0.56310021)
121122

122123
assert all("embedding_field" not in d for d in results)
123124

0 commit comments

Comments
 (0)