Skip to content

Commit 6a4711d

Browse files
Yuri Zmytrakov
authored and committed
fix: the default and max allowed returned values for collections and items
Ensure collections and items endpoints use their respective default and maximum limit values.
1 parent 7065798 commit 6a4711d

File tree

8 files changed

+175
-88
lines changed

8 files changed

+175
-88
lines changed

CHANGELOG.md

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,9 @@ and this project adheres to [Semantic Versioning](http://semver.org/spec/v2.0.0.
1111

1212
### Changed
1313

14+
- Removed the `ENV_MAX_LIMIT` environment variable; the maximum number of returned results is now configured with the `STAC_GLOBAL_COLLECTION_MAX_LIMIT` and `STAC_GLOBAL_ITEM_MAX_LIMIT` environment variables. [#482](https://github.com/stac-utils/stac-fastapi-elasticsearch-opensearch/pull/482)
15+
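- Changed the default and maximum pagination limits for the collections and items endpoints: defaults now come from `STAC_DEFAULT_COLLECTION_LIMIT` (default `300`) and `STAC_DEFAULT_ITEM_LIMIT` (default `10`), replacing the shared `STAC_ITEM_LIMIT` variable. [#482](https://github.com/stac-utils/stac-fastapi-elasticsearch-opensearch/pull/482)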
16+
1417
### Fixed
1518

1619
[v6.5.0] - 2025-09-29

README.md

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -299,9 +299,11 @@ You can customize additional settings in your `.env` file:
299299
| `ENABLE_COLLECTIONS_SEARCH` | Enable collection search extensions (sort, fields, free text search, structured filtering, and datetime filtering) on the core `/collections` endpoint. | `true` | Optional |
300300
| `ENABLE_COLLECTIONS_SEARCH_ROUTE` | Enable the custom `/collections-search` endpoint (both GET and POST methods). When disabled, the custom endpoint will not be available, but collection search extensions will still be available on the core `/collections` endpoint if `ENABLE_COLLECTIONS_SEARCH` is true. | `false` | Optional |
301301
| `ENABLE_TRANSACTIONS_EXTENSIONS` | Enables or disables the Transactions and Bulk Transactions API extensions. This is useful for deployments where mutating the catalog via the API should be prevented. If set to `true`, the POST `/collections` route for search will be unavailable in the API. | `true` | Optional |
302-
| `STAC_ITEM_LIMIT` | Sets the environment variable for result limiting to SFEOS for the number of returned items and STAC collections. | `10` | Optional |
302+
| `STAC_GLOBAL_COLLECTION_MAX_LIMIT` | Configures the maximum number of STAC collections that can be returned in a single search request. | N/A | Optional |
303+
| `STAC_DEFAULT_COLLECTION_LIMIT` | Configures the default number of STAC collections returned when no limit parameter is specified in the request. | `300` | Optional |
304+
| `STAC_GLOBAL_ITEM_MAX_LIMIT` | Configures the maximum number of STAC items that can be returned in a single search request. | N/A | Optional |
305+
| `STAC_DEFAULT_ITEM_LIMIT` | Configures the default number of STAC items returned when no limit parameter is specified in the request. | `10` | Optional |
303306
| `STAC_INDEX_ASSETS` | Controls if Assets are indexed when added to Elasticsearch/Opensearch. This allows asset fields to be included in search queries. | `false` | Optional |
304-
| `ENV_MAX_LIMIT` | Configures the environment variable in SFEOS to override the default `MAX_LIMIT`, which controls the limit parameter for returned items and STAC collections. | `10,000` | Optional |
305307
| `USE_DATETIME` | Configures the datetime search behavior in SFEOS. When enabled, searches both datetime field and falls back to start_datetime/end_datetime range for items with null datetime. When disabled, searches only by start_datetime/end_datetime range. | `true` | Optional |
306308

307309
> [!NOTE]

stac_fastapi/core/stac_fastapi/core/core.py

Lines changed: 44 additions & 34 deletions
Original file line numberDiff line numberDiff line change
@@ -270,33 +270,31 @@ async def all_collections(
270270
base_url = str(request.base_url)
271271

272272
# Get the global limit from environment variable
273-
global_limit = None
274-
env_limit = os.getenv("STAC_ITEM_LIMIT")
275-
if env_limit:
276-
try:
277-
global_limit = int(env_limit)
278-
except ValueError:
279-
# Handle invalid integer in environment variable
280-
pass
281-
282-
# Apply global limit if it exists
283-
if global_limit is not None:
284-
# If a limit was provided, use the smaller of the two
285-
if limit is not None:
286-
limit = min(limit, global_limit)
287-
else:
288-
limit = global_limit
273+
global_max_limit_env = os.getenv("STAC_GLOBAL_COLLECTION_MAX_LIMIT")
274+
if global_max_limit_env is not None:
275+
global_max_limit = int(global_max_limit_env)
289276
else:
290-
# No global limit, use provided limit or default
291-
if limit is None:
292-
query_limit = request.query_params.get("limit")
293-
if query_limit:
294-
try:
295-
limit = int(query_limit)
296-
except ValueError:
297-
limit = 10
298-
else:
299-
limit = 10
277+
global_max_limit = None
278+
default_limit = int(os.getenv("STAC_DEFAULT_COLLECTION_LIMIT", 300))
279+
query_limit = request.query_params.get("limit")
280+
281+
body_limit = None
282+
try:
283+
if request.method == "POST" and request.body():
284+
body_data = await request.json()
285+
body_limit = body_data.get("limit")
286+
except Exception:
287+
pass
288+
289+
if body_limit is not None:
290+
limit = int(body_limit)
291+
elif query_limit:
292+
limit = int(query_limit)
293+
else:
294+
limit = default_limit
295+
296+
if global_max_limit is not None:
297+
limit = min(limit, global_max_limit)
300298

301299
token = request.query_params.get("token")
302300

@@ -562,7 +560,7 @@ async def item_collection(
562560
request (Request): FastAPI Request object.
563561
bbox (Optional[BBox]): Optional bounding box filter.
564562
datetime (Optional[str]): Optional datetime or interval filter.
565-
limit (Optional[int]): Optional page size. Defaults to env ``STAC_ITEM_LIMIT`` when unset.
563+
limit (Optional[int]): Optional page size. Defaults to env `STAC_DEFAULT_ITEM_LIMIT` when unset.
566564
sortby (Optional[str]): Optional sort specification. Accepts repeated values
567565
like ``sortby=-properties.datetime`` or ``sortby=+id``. Bare fields (e.g. ``sortby=id``)
568566
imply ascending order.
@@ -653,15 +651,12 @@ async def get_search(
653651
q (Optional[List[str]]): Free text query to filter the results.
654652
intersects (Optional[str]): GeoJSON geometry to search in.
655653
kwargs: Additional parameters to be passed to the API.
656-
657654
Returns:
658655
ItemCollection: Collection of `Item` objects representing the search results.
659656
660657
Raises:
661658
HTTPException: If any error occurs while searching the catalog.
662659
"""
663-
limit = int(request.query_params.get("limit", os.getenv("STAC_ITEM_LIMIT", 10)))
664-
665660
base_args = {
666661
"collections": collections,
667662
"ids": ids,
@@ -736,6 +731,25 @@ async def post_search(
736731
Raises:
737732
HTTPException: If there is an error with the cql2_json filter.
738733
"""
734+
global_max_limit_env = os.getenv("STAC_GLOBAL_ITEM_MAX_LIMIT")
735+
if global_max_limit_env is not None:
736+
global_max_limit = int(global_max_limit_env)
737+
else:
738+
global_max_limit = None
739+
default_limit = int(os.getenv("STAC_DEFAULT_ITEM_LIMIT", 10))
740+
741+
requested_limit = getattr(search_request, "limit", None)
742+
743+
if requested_limit is None:
744+
limit = default_limit
745+
else:
746+
limit = requested_limit
747+
748+
if global_max_limit:
749+
limit = min(limit, global_max_limit)
750+
751+
search_request.limit = limit
752+
739753
base_url = str(request.base_url)
740754

741755
search = self.database.make_search()
@@ -812,10 +826,6 @@ async def post_search(
812826
if hasattr(search_request, "sortby") and getattr(search_request, "sortby"):
813827
sort = self.database.populate_sort(getattr(search_request, "sortby"))
814828

815-
limit = 10
816-
if search_request.limit:
817-
limit = search_request.limit
818-
819829
# Use token from the request if the model doesn't define it
820830
token_param = getattr(
821831
search_request, "token", None

stac_fastapi/core/stac_fastapi/core/utilities.py

Lines changed: 1 addition & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -10,15 +10,7 @@
1010

1111
from stac_fastapi.types.stac import Item
1212

13-
14-
def get_max_limit():
15-
"""
16-
Retrieve a MAX_LIMIT value from an environment variable.
17-
18-
Returns:
19-
int: The int value parsed from the environment variable.
20-
"""
21-
return int(os.getenv("ENV_MAX_LIMIT", 10000))
13+
MAX_LIMIT = 10000
2214

2315

2416
def get_bool_env(name: str, default: Union[bool, str] = False) -> bool:

stac_fastapi/elasticsearch/stac_fastapi/elasticsearch/database_logic.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@
1717

1818
from stac_fastapi.core.base_database_logic import BaseDatabaseLogic
1919
from stac_fastapi.core.serializers import CollectionSerializer, ItemSerializer
20-
from stac_fastapi.core.utilities import bbox2polygon, get_bool_env, get_max_limit
20+
from stac_fastapi.core.utilities import MAX_LIMIT, bbox2polygon, get_bool_env
2121
from stac_fastapi.elasticsearch.config import AsyncElasticsearchSettings
2222
from stac_fastapi.elasticsearch.config import (
2323
ElasticsearchSettings as SyncElasticsearchSettings,
@@ -818,7 +818,7 @@ async def execute_search(
818818
index_param = ITEM_INDICES
819819
query = add_collections_to_body(collection_ids, query)
820820

821-
max_result_window = get_max_limit()
821+
max_result_window = MAX_LIMIT
822822

823823
size_limit = min(limit + 1, max_result_window)
824824

stac_fastapi/opensearch/stac_fastapi/opensearch/database_logic.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@
1717

1818
from stac_fastapi.core.base_database_logic import BaseDatabaseLogic
1919
from stac_fastapi.core.serializers import CollectionSerializer, ItemSerializer
20-
from stac_fastapi.core.utilities import bbox2polygon, get_bool_env, get_max_limit
20+
from stac_fastapi.core.utilities import MAX_LIMIT, bbox2polygon, get_bool_env
2121
from stac_fastapi.extensions.core.transaction.request import (
2222
PartialCollection,
2323
PartialItem,
@@ -810,7 +810,7 @@ async def execute_search(
810810

811811
search_body["sort"] = sort if sort else DEFAULT_SORT
812812

813-
max_result_window = get_max_limit()
813+
max_result_window = MAX_LIMIT
814814

815815
size_limit = min(limit + 1, max_result_window)
816816

stac_fastapi/tests/api/test_api.py

Lines changed: 64 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -1475,70 +1475,102 @@ def create_items(date_prefix: str, start_day: int, count: int) -> dict:
14751475

14761476

14771477
@pytest.mark.asyncio
1478-
async def test_collections_limit_env_variable(app_client, txn_client, load_test_data):
1479-
limit = "5"
1480-
os.environ["STAC_ITEM_LIMIT"] = limit
1481-
item = load_test_data("test_collection.json")
1478+
async def test_global_collection_max_limit_set(app_client, txn_client, load_test_data):
1479+
"""Test with global collection max limit set, expect cap the limit"""
1480+
os.environ["STAC_GLOBAL_COLLECTION_MAX_LIMIT"] = "5"
14821481

14831482
for i in range(10):
1484-
test_collection = item.copy()
1485-
test_collection["id"] = f"test-collection-env-{i}"
1486-
test_collection["title"] = f"Test Collection Env {i}"
1483+
test_collection = load_test_data("test_collection.json")
1484+
test_collection_id = f"test-collection-global-{i}"
1485+
test_collection["id"] = test_collection_id
1486+
await create_collection(txn_client, test_collection)
1487+
1488+
resp = await app_client.get("/collections?limit=10")
1489+
assert resp.status_code == 200
1490+
resp_json = resp.json()
1491+
assert len(resp_json["collections"]) == 5
1492+
1493+
del os.environ["STAC_GLOBAL_COLLECTION_MAX_LIMIT"]
1494+
1495+
1496+
@pytest.mark.asyncio
1497+
async def test_default_collection_limit(app_client, txn_client, load_test_data):
1498+
"""Test default collection limit set, should use default when no limit provided"""
1499+
os.environ["STAC_DEFAULT_COLLECTION_LIMIT"] = "5"
1500+
1501+
for i in range(10):
1502+
test_collection = load_test_data("test_collection.json")
1503+
test_collection_id = f"test-collection-default-{i}"
1504+
test_collection["id"] = test_collection_id
14871505
await create_collection(txn_client, test_collection)
14881506

14891507
resp = await app_client.get("/collections")
14901508
assert resp.status_code == 200
14911509
resp_json = resp.json()
1492-
assert int(limit) == len(resp_json["collections"])
1510+
assert len(resp_json["collections"]) == 5
1511+
1512+
del os.environ["STAC_DEFAULT_COLLECTION_LIMIT"]
14931513

14941514

14951515
@pytest.mark.asyncio
1496-
async def test_search_collection_limit_env_variable(
1497-
app_client, txn_client, load_test_data
1498-
):
1499-
limit = "5"
1500-
os.environ["STAC_ITEM_LIMIT"] = limit
1516+
async def test_no_global_item_max_limit_set(app_client, txn_client, load_test_data):
1517+
"""Test with no global max limit set for items"""
1518+
1519+
if "STAC_GLOBAL_ITEM_MAX_LIMIT" in os.environ:
1520+
del os.environ["STAC_GLOBAL_ITEM_MAX_LIMIT"]
15011521

15021522
test_collection = load_test_data("test_collection.json")
1503-
test_collection_id = "test-collection-search-limit"
1523+
test_collection_id = "test-collection-no-global-limit"
15041524
test_collection["id"] = test_collection_id
15051525
await create_collection(txn_client, test_collection)
15061526

15071527
item = load_test_data("test_item.json")
15081528
item["collection"] = test_collection_id
15091529

1510-
for i in range(10):
1530+
for i in range(20):
15111531
test_item = item.copy()
1512-
test_item["id"] = f"test-item-search-{i}"
1532+
test_item["id"] = f"test-item-{i}"
15131533
await create_item(txn_client, test_item)
15141534

1515-
resp = await app_client.get("/search", params={"collections": [test_collection_id]})
1535+
resp = await app_client.get(f"/collections/{test_collection_id}/items?limit=20")
1536+
assert resp.status_code == 200
1537+
resp_json = resp.json()
1538+
assert len(resp_json["features"]) == 20
1539+
1540+
resp = await app_client.get(f"/search?collections={test_collection_id}&limit=20")
15161541
assert resp.status_code == 200
15171542
resp_json = resp.json()
1518-
assert int(limit) == len(resp_json["features"])
1543+
assert len(resp_json["features"]) == 20
15191544

1545+
resp = await app_client.post(
1546+
"/search", json={"collections": [test_collection_id], "limit": 20}
1547+
)
1548+
assert resp.status_code == 200
1549+
resp_json = resp.json()
1550+
assert len(resp_json["features"]) == 20
15201551

1521-
async def test_search_max_item_limit(
1522-
app_client, load_test_data, txn_client, monkeypatch
1523-
):
1524-
limit = "10"
1525-
monkeypatch.setenv("ENV_MAX_LIMIT", limit)
15261552

1527-
test_collection = load_test_data("test_collection.json")
1528-
await create_collection(txn_client, test_collection)
1553+
@pytest.mark.asyncio
1554+
async def test_no_global_collection_max_limit_set(
1555+
app_client, txn_client, load_test_data
1556+
):
1557+
"""Test with no global max limit set for collections"""
15291558

1530-
item = load_test_data("test_item.json")
1559+
if "STAC_GLOBAL_COLLECTION_MAX_LIMIT" in os.environ:
1560+
del os.environ["STAC_GLOBAL_COLLECTION_MAX_LIMIT"]
15311561

1562+
test_collections = []
15321563
for i in range(20):
1533-
test_item = item.copy()
1534-
test_item["id"] = f"test-item-collection-{i}"
1535-
await create_item(txn_client, test_item)
1536-
1537-
resp = await app_client.get("/search", params={"limit": 20})
1564+
test_collection = load_test_data("test_collection.json")
1565+
test_collection_id = f"test-collection-no-global-limit-{i}"
1566+
test_collection["id"] = test_collection_id
1567+
await create_collection(txn_client, test_collection)
1568+
test_collections.append(test_collection_id)
15381569

1570+
resp = await app_client.get("/collections?limit=20")
15391571
assert resp.status_code == 200
15401572
resp_json = resp.json()
1541-
assert int(limit) == len(resp_json["features"])
1573+
assert len(resp_json["collections"]) == 20
15421574

15431575

15441576
@pytest.mark.asyncio

0 commit comments

Comments
 (0)