Use http_retry decorator from swh.core.retry module
The http_retry decorator has been moved to the swh-core package in order to ease its reuse across swh packages.
This commit is contained in:
parent
1ee549fc9d
commit
4f57e84450
13 changed files with 32 additions and 201 deletions
|
@ -1,16 +1,10 @@
|
|||
# Copyright (C) 2018-2022 the Software Heritage developers
|
||||
# Copyright (C) 2018-2023 the Software Heritage developers
|
||||
# License: GNU General Public License version 3, or any later version
|
||||
# See top-level LICENSE file for more information
|
||||
|
||||
from typing import Callable, Iterator, Optional, Tuple
|
||||
from typing import Iterator, Optional, Tuple
|
||||
import urllib.parse
|
||||
|
||||
from requests.exceptions import ConnectionError, HTTPError
|
||||
from requests.status_codes import codes
|
||||
from tenacity import retry as tenacity_retry
|
||||
from tenacity.stop import stop_after_attempt
|
||||
from tenacity.wait import wait_exponential
|
||||
|
||||
|
||||
def split_range(total_pages: int, nb_pages: int) -> Iterator[Tuple[int, int]]:
|
||||
"""Split `total_pages` into mostly `nb_pages` ranges. In some cases, the last range can
|
||||
|
@ -36,84 +30,6 @@ def split_range(total_pages: int, nb_pages: int) -> Iterator[Tuple[int, int]]:
|
|||
yield index, total_pages
|
||||
|
||||
|
||||
def is_throttling_exception(e: Exception) -> bool:
    """
    Checks if an exception is a requests.exceptions.HTTPError for
    a response with status code 429 (too many requests).

    Args:
        e: the exception to inspect

    Returns:
        True only when ``e`` is an HTTPError carrying a response whose status
        code is 429; False otherwise, including when no response is attached
        to the exception.
    """
    if not isinstance(e, HTTPError):
        return False
    # An HTTPError may be raised without any response attached. Compare against
    # None explicitly: in requests, a Response for an error status is falsy.
    response = e.response
    if response is None:
        return False
    return response.status_code == codes.too_many_requests
|
||||
|
||||
|
||||
def is_retryable_exception(e: Exception) -> bool:
    """
    Checks if an exception is worth retrying (connection, throttling or a server error).

    Args:
        e: the exception to inspect

    Returns:
        True for a ConnectionError, for an HTTPError whose response has status
        code 429, or for an HTTPError whose response has a status code >= 500;
        False otherwise, including for an HTTPError with no response attached.
    """
    if isinstance(e, ConnectionError):
        return True
    # Only HTTP errors that actually carry a response can be classified by
    # status code. The check is against None on purpose: in requests, a
    # Response for an error status is falsy.
    if not isinstance(e, HTTPError) or e.response is None:
        return False
    return is_throttling_exception(e) or e.response.status_code >= 500
|
||||
|
||||
|
||||
def retry_if_exception(retry_state, predicate: Callable[[Exception], bool]) -> bool:
    """
    Tenacity retry predicate delegating the decision to ``predicate``.

    Args:
        retry_state: object whose ``outcome`` attribute exposes a ``failed``
            flag and an ``exception()`` method
        predicate: function deciding, from the raised exception, whether the
            call should be retried

    Returns:
        The result of ``predicate`` applied to the raised exception when the
        last attempt failed, False when it did not fail.
    """
    outcome = retry_state.outcome
    # Nothing to retry when the last attempt did not fail.
    if not outcome.failed:
        return False
    return predicate(outcome.exception())
|
||||
|
||||
|
||||
def retry_policy_generic(retry_state) -> bool:
    """
    Tenacity retry predicate for failed requests.

    The decision is delegated to ``is_retryable_exception``, so a retry is
    requested for:

    - ConnectionError
    - Server errors (status >= 500)
    - Throttling errors (status == 429)

    Other status codes (e.g. 403 or 404) are not handled.

    Args:
        retry_state: the tenacity retry state of the last attempt

    Returns:
        True when the last attempt failed with a retryable exception.
    """
    return retry_if_exception(retry_state, predicate=is_retryable_exception)
|
||||
|
||||
|
||||
# Base of the exponential backoff used as the default wait strategy.
WAIT_EXP_BASE = 10
# Default number of attempts after which retrying stops.
MAX_NUMBER_ATTEMPTS = 5


def http_retry(
    retry=retry_policy_generic,
    wait=wait_exponential(exp_base=WAIT_EXP_BASE),
    stop=stop_after_attempt(max_attempt_number=MAX_NUMBER_ATTEMPTS),
    **retry_args,
):
    """
    Decorator based on `tenacity` for retrying a function performing HTTP
    requests that may fail.

    It provides a default configuration that should work properly in most
    cases but all `tenacity.retry` parameters can also be overridden in client
    code.

    When the maximum number of attempts is reached, the exception raised by the
    decorated function is reraised (``reraise=True`` is always passed to
    tenacity).

    Args:
        retry: function defining request retry condition (default to
            ``retry_policy_generic``: connection errors, server errors and
            429 status code)
            https://tenacity.readthedocs.io/en/latest/#whether-to-retry

        wait: function defining wait strategy before retrying (default to exponential
            backoff) https://tenacity.readthedocs.io/en/latest/#waiting-before-retrying

        stop: function defining when to stop retrying (default after 5 attempts)
            https://tenacity.readthedocs.io/en/latest/#stopping

        retry_args: any other keyword argument, forwarded as is to
            `tenacity.retry`

    Returns:
        The decorator built by `tenacity.retry` with these settings.
    """
    tenacity_options = dict(retry=retry, wait=wait, stop=stop, reraise=True)
    return tenacity_retry(**tenacity_options, **retry_args)
|
||||
|
||||
|
||||
def is_valid_origin_url(url: Optional[str]) -> bool:
|
||||
"""Returns whether the given string is a valid origin URL.
|
||||
This excludes Git SSH URLs and pseudo-URLs (eg. ``ssh://git@example.org:foo``
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue