Source code for eth_defi.provider.fallback

"""JSON-RPC provider fallback and redundancy mechanisms.

- See :py:class:`FallbackProvider`
"""
import enum
import time
from collections import defaultdict, Counter
from typing import List, Any, cast, Dict
import logging

from web3 import Web3
from web3.types import RPCEndpoint, RPCResponse

from eth_defi.middleware import is_retryable_http_exception, DEFAULT_RETRYABLE_EXCEPTIONS, DEFAULT_RETRYABLE_HTTP_STATUS_CODES, DEFAULT_RETRYABLE_RPC_ERROR_CODES, ProbablyNodeHasNoBlock
from eth_defi.provider.named import BaseNamedProvider, NamedProvider, get_provider_name

logger = logging.getLogger(__name__)


[docs]class FallbackStrategy(enum.Enum):
    """Different supported fallback strategies."""

    #: Automatically switch to the next provider on an error
    #:
    cycle_on_error = "cycle_on_error"


[docs]class FallbackProvider(BaseNamedProvider):
    """Fault-tolerance for JSON-RPC requests with multiple providers.

    Fall back to the next provider on the list if a JSON-RPC request fails.
    Contains build-in retry logic in round-robin manner.
    We will also recover from situations when we suspect the node does not
    have the block data we are asking yet (but should have shorty).

    See also

    - :py:func:`eth_defi.middlware.exception_retry_middleware`

    - :py:func:`eth_defi.middlware.ProbablyNodeHasNoBlock`

    .. note::

        :py:class:`FallbackProvider` does not call any middlewares installed on the providers themselves.
    """

[docs]    def __init__(
        self,
        providers: List[NamedProvider],
        strategy=FallbackStrategy.cycle_on_error,
        retryable_exceptions=DEFAULT_RETRYABLE_EXCEPTIONS,
        retryable_status_codes=DEFAULT_RETRYABLE_HTTP_STATUS_CODES,
        retryable_rpc_error_codes=DEFAULT_RETRYABLE_RPC_ERROR_CODES,
        sleep: float = 5.0,
        backoff: float = 1.6,
        retries: int = 6,
        state_missing_switch_over_delay: float = 12.0,
        switchover_noisiness=logging.WARNING,
    ):
        """
        :param providers:
            List of provider we cycle through.

        :param strategy:
            What is the strategy to deal with errors.

            Currently on cycling supported.

        :param retryable_exceptions:
            List of exceptions we can retry.

        :param retryable_status_codes:
            List of HTTP status codes we can retry.

        :param retryable_rpc_error_codes:
            List of GoEthereum error codes we can retry.

        :param sleep:
            Seconds between retries.

        :param backoff:
            Multiplier to increase sleep.

        :param retries:
            How many retries we attempt before giving up.

        :param switchover_noisiness:
            How loud we are about switchover issues.

        :param state_missing_switch_over_delay:
            If we encounter state missing condition at node, what is the minimum time (seconds) we wait before trying to switch to next node.

            See code comments for details.

        """

        super().__init__()

        self.providers = providers

        for provider in providers:
            assert "http_retry_request" not in provider.middlewares, "http_retry_request middleware cannot be used with FallbackProvider"

        #: Currently active provider
        self.currently_active_provider = 0

        self.strategy = strategy

        self.retryable_exceptions = retryable_exceptions
        self.retryable_status_codes = retryable_status_codes
        self.retryable_rpc_error_codes = retryable_rpc_error_codes
        self.sleep = sleep
        self.backoff = backoff
        self.retries = retries

        #: provider number -> API name -> call count mappings.
        # This tracks completed API requests.
        self.api_call_counts = defaultdict(Counter)

        #: provider number-> api method name -> retry counts dict
        self.api_retry_counts = defaultdict(Counter)

        self.retry_count = 0
        self.switchover_noisiness = switchover_noisiness

        # Wait 12 seconds for block missing errors
        self.state_missing_switch_over_delay = 12.0

    def __repr__(self):
        names = [get_provider_name(p) for p in self.providers]
        return f"<Fallback provider {', '.join(names)}>"

    @property
    def endpoint_uri(self):
        """Return the active node URI endpoint.

        For :py:class:`HTTPProvider` compatibility.
        """
        return self.get_active_provider().endpoint_uri

[docs]    def has_multiple_providers(self) -> bool:
        """Have we configured multiple providers"""
        return len(self.providers) >= 2

[docs]    def switch_provider(self):
        """Switch to next available provider."""
        provider = self.get_active_provider()
        old_provider_name = get_provider_name(provider)
        self.currently_active_provider = (self.currently_active_provider + 1) % len(self.providers)
        new_provider_name = get_provider_name(self.get_active_provider())
        if old_provider_name != new_provider_name:
            logger.log(self.switchover_noisiness, "Switched RPC providers %s -> %s\n", old_provider_name, new_provider_name)
        else:
            logger.log(self.switchover_noisiness, "Only 1 RPC provider configured: %s, cannot switch, sleeping and hoping the issue resolves itself", old_provider_name)

[docs]    def get_active_provider(self) -> NamedProvider:
        """Get currently active provider.

        If this provider fails, we are automatically recycled to the next one.
        """
        return self.providers[self.currently_active_provider]

[docs]    def get_total_api_call_counts(self) -> Dict[str, int]:
        """Get API call coubst across all providers"""
        total = Counter()
        for provider, count_dict in self.api_call_counts.items():
            for method, count in count_dict.items():
                total[method] += count
        return total

[docs]    def make_request(self, method: RPCEndpoint, params: Any) -> RPCResponse:
        """Make a request.

        - By default use the current active provider

        - If there are errors try cycle through providers and sleep
          between cycles until one provider works
        """
        current_sleep = self.sleep
        for i in range(self.retries + 1):
            provider = self.get_active_provider()
            try:
                # Call the underlying provider
                resp_data = provider.make_request(method, params)

                # We need to manually raise the exception here,
                # likely was raised by Web3.py itself in pre-6.0 versions.
                # If this behavior is some legacy Web3.py behavior and not present anymore,
                # we should replace this with a custom exception.
                # Might be also related to EthereumTester only code paths.
                if "error" in resp_data:
                    # {'jsonrpc': '2.0', 'id': 23, 'error': {'code': -32003, 'message': 'nonce too low'}}
                    # This will trigger exception that will be handled by is_retryable_http_exception()
                    raise ValueError(resp_data["error"])

                _check_faulty_rpc_response(method, params, resp_data)

                # Track API counts
                self.api_call_counts[self.currently_active_provider][method] += 1

                return resp_data

            except Exception as e:
                if is_retryable_http_exception(e, retryable_rpc_error_codes=self.retryable_rpc_error_codes, retryable_status_codes=self.retryable_status_codes, retryable_exceptions=self.retryable_exceptions, method=method, params=params):
                    if self.has_multiple_providers():
                        self.switch_provider()

                    if i < self.retries:
                        # Black messes up string new lines here
                        # See https://github.com/psf/black/issues/1837
                        logger.log(self.switchover_noisiness, "Encountered JSON-RPC retryable error %s\n When calling method: %s%s\n " "Retrying in %f seconds, retry #%d / %d", e, method, params, current_sleep, i + 1, self.retries)
                        time.sleep(current_sleep)
                        current_sleep *= self.backoff
                        self.retry_count += 1
                        self.api_retry_counts[self.currently_active_provider][method] += 1
                        continue
                    else:
                        raise  # Out of retries
                logger.info("Will not retry, method %s, as not a retryable exception %s: %s", method, e.__class__, e)
                raise  # Not retryable exception

        raise AssertionError("Should never be reached")


def _check_faulty_rpc_response(
    method: str,
    params: list,
    resp_data: dict,
):
    """Raise an exception on certain bad result conditions.

    We cannot raise this exception during the result format phase,
    because we are outside the fallover logic.
    """

    # A special case of eth_call returning empty result.
    # This happens if you call a smart contract for a block number
    # for which the node does not yet have a data or is still processing data.
    # This happens often on low-quality RPC providers (Ankr)
    # that route your call between different nodes between subsequent calls and those nodes
    # see a different state of EVM.
    # Down the line, not in middleware stack, this would lead to BadFunctionCallOutput
    # output. We work around this by detecting this conditino in middleware
    # stack and trigger middleware fallover node switch if the condition is detected.
    #
    if method == "eth_call":
        args, block_identifier = params
        if block_identifier != "latest":
            result = resp_data["result"]
            if result == "0x":
                # eth_call returned empty response,
                # assume node does not have data yet,
                # switch to another node, wait some extra time
                # to ensure it gets blocks
                # current_sleep = max(self.state_missing_switch_over_delay, current_sleep)
                raise ProbablyNodeHasNoBlock(f"Node lacked state data when doing eth_call for block {block_identifier}")

    # BlockNotFound exception gets applied only later with the formatters,
    # so we need to trigger fallover here.
    # LlamaNodes.com: web3.exceptions.BlockNotFound: Block with id: '0x2e4d582' not found.
    if method in (
        "eth_getBlockByNumber",
        "eth_getBlockByHash",
    ):
        block_identifier, *other_args = params
        result = resp_data["result"]
        if result in ("0x", None):
            # eth_call returned empty response,
            # assume node does not have data yet,
            # switch to another node, wait some extra time
            # to ensure it gets blocks
            # current_sleep = max(self.state_missing_switch_over_delay, current_sleep)
            raise ProbablyNodeHasNoBlock(f"Node did not have data for block {block_identifier} when calling {method}")


[docs]def get_fallback_provider(web3: Web3) -> FallbackProvider:
    """Get the fallback provider of a Wen3 instance.

    Can be nested in :py:class:`eth_defi.provider.mev_block.MEVBlockerProvider`.

    :param web3:
        Web3 instance

    :raise AssertionError:
        If there is no fallback provider available
    """
    provider = web3.provider
    if isinstance(provider, FallbackProvider):
        return cast(FallbackProvider, provider)

    # MEVBlockerProvider
    call_provider = getattr(provider, "call_provider", None)
    if call_provider:
        return cast(FallbackProvider, call_provider)

    raise AssertionError(f"Does not know how fallback provider is configured: {[provider]}")