Skip to content
This repository has been archived by the owner on Oct 10, 2024. It is now read-only.

Commit

Permalink
add support for new expanded param in paged_articles (fix mediaclou…
Browse files: browse the repository at this point in the history
  • Loading branch information
rahulbot committed Dec 8, 2023
1 parent cb03fbc commit 7174240
Show file tree
Hide file tree
Showing 2 changed files with 17 additions and 1 deletion.
5 changes: 4 additions & 1 deletion waybacknews/searchapi.py
Original file line number Diff line number Diff line change
Expand Up @@ -118,11 +118,14 @@ def all_articles(self, query: str, start_date: dt.datetime, end_date: dt.datetim
more_pages = True

def paged_articles(self, query: str, start_date: dt.datetime, end_date: dt.datetime,
page_size: Optional[int] = 1000, pagination_token: Optional[str] = None, **kwargs):
page_size: Optional[int] = 1000, expanded: bool = False,
pagination_token: Optional[str] = None, **kwargs):
"""
@return: one page of stories
"""
params = {"q": "{} AND {}".format(query, self._date_query_clause(start_date, end_date))}
if expanded:
params['expanded'] = 1
if pagination_token:
params['resume'] = pagination_token
params.update(kwargs)
Expand Down
13 changes: 13 additions & 0 deletions waybacknews/tests/test_waybacknews.py
Original file line number Diff line number Diff line change
Expand Up @@ -122,6 +122,19 @@ def test_paged_articles(self):
page2_urls = [s['url'] for s in page2]
assert page1_url1 not in page2_urls # verify pages don't overlap

def test_paged_expanded_articles(self):
    """Check that ``expanded`` controls whether stories carry ``text_content``.

    The first page is requested without ``expanded`` and none of its stories
    may contain a ``text_content`` key. The second page is requested with
    ``expanded=True`` (resuming from the first page's pagination token) and
    every one of its stories must contain that key.
    """
    query = "biden"
    start_date = dt.datetime(2023, 11, 25)
    end_date = dt.datetime(2023, 11, 26)

    page1, next_token1 = self._api.paged_articles(query, start_date, end_date)
    # Guard against a vacuous pass: an empty page would skip the loop below
    # and the test would succeed without checking anything.
    assert len(page1) > 0
    for s in page1:
        assert 'text_content' not in s

    # The token returned with the second page is not needed here.
    page2, _ = self._api.paged_articles(query, start_date, end_date,
                                        pagination_token=next_token1, expanded=True)
    assert len(page2) > 0
    for s in page2:
        assert 'text_content' in s


def test_top_sources(self):
results = self._api.top_sources("coronavirus", dt.datetime(2022, 3, 1), dt.datetime(2022, 4, 1))
assert len(results) > 0
Expand Down

0 comments on commit 7174240

Please sign in to comment.