forked from amundsen-io/amundsendatabuilder
-
Notifications
You must be signed in to change notification settings - Fork 0
/
mode_paginated_rest_api_query.py
71 lines (55 loc) · 2.57 KB
/
mode_paginated_rest_api_query.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
# Copyright Contributors to the Amundsen project.
# SPDX-License-Identifier: Apache-2.0
import logging
from typing import Any, Dict
import requests
from jsonpath_rw import parse
from databuilder.rest_api.rest_api_query import RestApiQuery
# Number of records on one page that counts as a "full" page, which hints that there might be a next page.
# In the list-reports-on-a-space API, it's 30.
DEFAULT_MAX_RECORD_SIZE = 30
# Suffix appended to the URL to request a specific page; '{}' is filled with the page number.
PAGE_SUFFIX_TEMPLATE = '?page={}'
# JSONPath used to pick the records of one page out of the response body.
LIST_REPORTS_PAGINATION_JSON_PATH = '_embedded.reports[*]' # So far this is the only paginated API that we need.
LOGGER = logging.getLogger(__name__)
class ModePaginatedRestApiQuery(RestApiQuery):
    """
    REST API query that follows Mode's page-numbered pagination.

    Certain APIs, such as getting the list of reports on a space, are paginated with the query term ``page``.
    https://mode.com/developer/api-cookbook/management/get-all-reports/
    This subclass detects whether there may be another page and updates the URL to get the next page.
    """

    def __init__(self,
                 pagination_json_path: str = LIST_REPORTS_PAGINATION_JSON_PATH,
                 max_record_size: int = DEFAULT_MAX_RECORD_SIZE,
                 **kwargs: Any
                 ) -> None:
        """
        :param pagination_json_path: JSONPath expression that selects the records of one page in the
            JSON response body.
        :param max_record_size: number of records at (or above) which a page is considered full, i.e.
            another page may exist.
        :param kwargs: passed through unchanged to ``RestApiQuery.__init__``.
        """
        super().__init__(**kwargs)
        # Remember the URL without any page suffix; self._url is rebuilt from it for every page.
        # NOTE(review): self._url is presumably set by RestApiQuery.__init__ -- confirm.
        self._original_url = self._url
        self._max_record_size = max_record_size
        self._current_page = 1
        # Parse the JSONPath once so it can be reused for every response.
        self._pagination_jsonpath_expr = parse(pagination_json_path)

    def _preprocess_url(self,
                        record: Dict[str, Any],
                        ) -> str:
        """
        Updates URL with page information.

        :param record: values substituted into the ``{...}`` placeholders of the URL via ``str.format``.
        :return: a URL that is ready to be called.
        """
        page_suffix = PAGE_SUFFIX_TEMPLATE.format(self._current_page)  # example: ?page=2
        if '?' in self._original_url:
            # The base URL already carries a query string. A second '?' would yield a malformed URL
            # (http://foo.bar/resources?a=b?page=2), so chain the page term with '&' instead.
            page_suffix = '&' + page_suffix.lstrip('?')

        # example: http://foo.bar/resources?page=2
        self._url = f"{self._original_url}{page_suffix}"
        return self._url.format(**record)

    def _post_process(self, response: requests.Response, ) -> None:
        """
        Updates the pagination trigger (self._more_pages) as well as the current page (self._current_page).

        Mode does not have an explicit "has next page" indicator. Instead, a page holding at least
        ``max_record_size`` records implies that there could be more records on the next page.
        NOTE(review): self._more_pages is presumably read by RestApiQuery to decide whether to request
        another page -- confirm against the base class.

        :param response: HTTP response of the page that was just fetched; its body must be JSON.
        :return: None
        """
        # Only the number of matched records matters, not their values.
        record_count = sum(1 for _ in self._pagination_jsonpath_expr.find(response.json()))

        # The explicit "> 0" check keeps an empty page from being treated as full when
        # max_record_size is zero or negative, which would otherwise page forever.
        if record_count > 0 and record_count >= self._max_record_size:
            self._more_pages = True
            self._current_page += 1
        else:
            # Last page reached: stop paginating and rewind so the next query starts at page 1.
            self._more_pages = False
            self._current_page = 1