From dd084a9ab62dcfdd3aacd39da69f74b8652047f7 Mon Sep 17 00:00:00 2001 From: Pete Gadomski Date: Fri, 20 Jan 2023 11:50:35 -0700 Subject: [PATCH] fix: empty pages for collections and features --- pystac_client/stac_api_io.py | 4 +- tests/test_stac_api_io.py | 82 ++++++++++++++++++++++++++---------- 2 files changed, 63 insertions(+), 23 deletions(-) diff --git a/pystac_client/stac_api_io.py b/pystac_client/stac_api_io.py index ec2d9747..46e3321a 100644 --- a/pystac_client/stac_api_io.py +++ b/pystac_client/stac_api_io.py @@ -227,6 +227,8 @@ def get_pages( Dict[str, Any] : JSON content from a single page """ page = self.read_json(url, method=method, parameters=parameters) + if not (page.get("features") or page.get("collections")): + return None yield page next_link = next( @@ -235,7 +237,7 @@ def get_pages( while next_link: link = Link.from_dict(next_link) page = self.read_json(link, parameters=parameters) - if not page.get("features", False): + if not (page.get("features", False) or page.get("collections")): return None yield page diff --git a/tests/test_stac_api_io.py b/tests/test_stac_api_io.py index 4bfb2865..8eb56ce9 100644 --- a/tests/test_stac_api_io.py +++ b/tests/test_stac_api_io.py @@ -169,75 +169,113 @@ def test_write(self, tmp_path: Path) -> None: data = file.read() assert data == "Hi there!" - def test_stop_on_empty_page(self, requests_mock: Mocker) -> None: + @pytest.mark.parametrize( + ("attribute", "endpoint"), + (("features", "search"), ("collections", "collections")), + ) + def test_stop_on_empty_page( + self, requests_mock: Mocker, attribute: str, endpoint: str + ) -> None: + url = f"https://pystac-client.test/{endpoint}" requests_mock.get( - "https://pystac-client.test/search", + url, status_code=200, json={ - "features": [{"foo": "bar"}], + attribute: [{"foo": "bar"}], "links": [ { "rel": "next", - "href": "https://pystac-client.test/search?token=baz", + "href": url + "?token=baz", } ], }, ) requests_mock.get( - "https://pystac-client.test/search?token=baz", + url + "?token=baz", status_code=200, json={ - "features": [], + attribute: [], "links": [ { "rel": "next", - "href": "https://pystac-client.test/search?token=baw", + "href": url + "?token=bam", } ], }, ) requests_mock.get( - "https://pystac-client.test/search?token=baw", + url + "?token=bam", status_code=500, - json={}, ) stac_api_io = StacApiIO() - pages = list(stac_api_io.get_pages("https://pystac-client.test/search")) + pages = list(stac_api_io.get_pages(url)) assert len(pages) == 1 - assert pages[0]["features"][0]["foo"] == "bar" - - def test_stop_on_featureless_page(self, requests_mock: Mocker) -> None: + assert pages[0][attribute][0]["foo"] == "bar" + + @pytest.mark.parametrize( + ("attribute", "endpoint"), + (("features", "search"), ("collections", "collections")), + ) + def test_stop_on_attributeless_page( + self, requests_mock: Mocker, attribute: str, endpoint: str + ) -> None: + url = f"https://pystac-client.test/{endpoint}" requests_mock.get( - "https://pystac-client.test/search", + url, status_code=200, json={ - "features": [{"foo": "bar"}], + attribute: [{"foo": "bar"}], "links": [ { "rel": "next", - "href": "https://pystac-client.test/search?token=baz", + "href": url + "?token=baz", } ], }, ) requests_mock.get( - "https://pystac-client.test/search?token=baz", + url + "?token=baz", status_code=200, json={ "links": [ { "rel": "next", - "href": "https://pystac-client.test/search?token=baw", + "href": url + "?token=bam", } ], }, ) requests_mock.get( - "https://pystac-client.test/search?token=baw", + url + "?token=bam", status_code=500, - json={}, ) stac_api_io = StacApiIO() - pages = list(stac_api_io.get_pages("https://pystac-client.test/search")) + pages = list(stac_api_io.get_pages(url)) assert len(pages) == 1 - assert pages[0]["features"][0]["foo"] == "bar" + assert pages[0][attribute][0]["foo"] == "bar" + + @pytest.mark.parametrize( + ("attribute", "endpoint"), + (("features", "search"), ("collections", "collections")), + ) + def test_stop_on_first_empty_page( + self, requests_mock: Mocker, attribute: str, endpoint: str + ) -> None: + url = f"https://pystac-client.test/{endpoint}" + requests_mock.get( + url, + status_code=200, + json={ + attribute: [], + "links": [ + { + "rel": "next", + "href": url + "?token=bam", + } + ], + }, + ) + requests_mock.get(url + "?token=bam", status_code=500) + stac_api_io = StacApiIO() + pages = list(stac_api_io.get_pages(url)) + assert len(pages) == 0