Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Use fake clock for faster unit tests #533

Merged
merged 6 commits into from
Feb 8, 2024
Merged
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
49 changes: 49 additions & 0 deletions databricks/sdk/clock.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,49 @@
import abc
import time


class Clock(metaclass=abc.ABCMeta):

@abc.abstractmethod
def time(self) -> float:
"""
Return the current time in seconds since the Epoch.
Fractions of a second may be present if the system clock provides them.

:return: The current time in seconds since the Epoch.
"""

@abc.abstractmethod
def sleep(self, seconds: float) -> None:
"""
Return the current time in seconds since the Epoch.
Fractions of a second may be present if the system clock provides them.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Don't seem to be accurate?

:param seconds: The duration to sleep in seconds.
:return:
"""


class RealClock(Clock):
"""
A real clock that uses the ``time`` module to get the current time and sleep.
"""

def time(self) -> float:
"""
Return the current time in seconds since the Epoch.
Fractions of a second may be present if the system clock provides them.

:return: The current time in seconds since the Epoch.
"""
return time.time()

def sleep(self, seconds: float) -> None:
"""
Return the current time in seconds since the Epoch.
Fractions of a second may be present if the system clock provides them.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

These lines don't seem to be accurate?

:param seconds: The duration to sleep in seconds.
:return:
"""
time.sleep(seconds)
10 changes: 8 additions & 2 deletions databricks/sdk/core.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@

from requests.adapters import HTTPAdapter

from .clock import Clock, RealClock
from .config import *
# To preserve backwards compatibility (as these definitions were previously in this module)
from .credentials_provider import *
Expand All @@ -22,12 +23,16 @@ class ApiClient:
_cfg: Config
_RETRY_AFTER_DEFAULT: int = 1

def __init__(self, cfg: Config = None):
def __init__(self, cfg: Config = None, clock: Clock = None):

if cfg is None:
cfg = Config()

if clock is None:
clock = RealClock()

self._cfg = cfg
self._clock = clock
# See https://github.com/databricks/databricks-sdk-go/blob/main/client/client.go#L34-L35
self._debug_truncate_bytes = cfg.debug_truncate_bytes if cfg.debug_truncate_bytes else 96
self._retry_timeout_seconds = cfg.retry_timeout_seconds if cfg.retry_timeout_seconds else 300
Expand Down Expand Up @@ -123,7 +128,8 @@ def do(self,
headers = {}
headers['User-Agent'] = self._user_agent_base
retryable = retried(timeout=timedelta(seconds=self._retry_timeout_seconds),
is_retryable=self._is_retryable)
is_retryable=self._is_retryable,
clock=self._clock)
return retryable(self._perform)(method,
path,
query=query,
Expand Down
14 changes: 9 additions & 5 deletions databricks/sdk/retries.py
Original file line number Diff line number Diff line change
@@ -1,30 +1,34 @@
import functools
import logging
import time
from datetime import timedelta
from random import random
from typing import Callable, Optional, Sequence, Type

from .clock import Clock, RealClock

logger = logging.getLogger(__name__)


def retried(*,
on: Sequence[Type[BaseException]] = None,
is_retryable: Callable[[BaseException], Optional[str]] = None,
timeout=timedelta(minutes=20)):
timeout=timedelta(minutes=20),
clock: Clock = None):
has_allowlist = on is not None
has_callback = is_retryable is not None
if not (has_allowlist or has_callback) or (has_allowlist and has_callback):
raise SyntaxError('either on=[Exception] or callback=lambda x: .. is required')
if clock is None:
clock = RealClock()

def decorator(func):

@functools.wraps(func)
def wrapper(*args, **kwargs):
deadline = time.time() + timeout.total_seconds()
deadline = clock.time() + timeout.total_seconds()
attempt = 1
last_err = None
while time.time() < deadline:
while clock.time() < deadline:
try:
return func(*args, **kwargs)
except Exception as err:
Expand All @@ -50,7 +54,7 @@ def wrapper(*args, **kwargs):
raise err

logger.debug(f'Retrying: {retry_reason} (sleeping ~{sleep}s)')
time.sleep(sleep + random())
clock.sleep(sleep + random())
attempt += 1
raise TimeoutError(f'Timed out after {timeout}') from last_err

Expand Down
16 changes: 16 additions & 0 deletions tests/clock.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,16 @@
from databricks.sdk.clock import Clock


class FakeClock(Clock):
"""
A simple clock that can be used to mock time in tests.
"""

def __init__(self, start_time: float = 0.0):
self._start_time = start_time

def time(self) -> float:
return self._start_time

def sleep(self, seconds: float) -> None:
self._start_time += seconds
13 changes: 7 additions & 6 deletions tests/test_core.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,7 @@
from databricks.sdk.service.iam import AccessControlRequest
from databricks.sdk.version import __version__

from .clock import FakeClock
from .conftest import noop_credentials


Expand Down Expand Up @@ -422,7 +423,7 @@ def inner(h: BaseHTTPRequestHandler):
requests.append(h.requestline)

with http_fixture_server(inner) as host:
api_client = ApiClient(Config(host=host, token='_'))
api_client = ApiClient(Config(host=host, token='_'), clock=FakeClock())
res = api_client.do('GET', '/foo')
assert 'foo' in res

Expand All @@ -445,7 +446,7 @@ def inner(h: BaseHTTPRequestHandler):
requests.append(h.requestline)

with http_fixture_server(inner) as host:
api_client = ApiClient(Config(host=host, token='_'))
api_client = ApiClient(Config(host=host, token='_'), clock=FakeClock())
res = api_client.do('GET', '/foo')
assert 'foo' in res

Expand All @@ -462,7 +463,7 @@ def inner(h: BaseHTTPRequestHandler):
requests.append(h.requestline)

with http_fixture_server(inner) as host:
api_client = ApiClient(Config(host=host, token='_', retry_timeout_seconds=1))
api_client = ApiClient(Config(host=host, token='_', retry_timeout_seconds=1), clock=FakeClock())
with pytest.raises(TimeoutError):
api_client.do('GET', '/foo')

Expand All @@ -484,7 +485,7 @@ def inner(h: BaseHTTPRequestHandler):
requests.append(h.requestline)

with http_fixture_server(inner) as host:
api_client = ApiClient(Config(host=host, token='_'))
api_client = ApiClient(Config(host=host, token='_'), clock=FakeClock())
res = api_client.do('GET', '/foo')
assert 'foo' in res

Expand All @@ -502,7 +503,7 @@ def inner(h: BaseHTTPRequestHandler):
requests.append(h.requestline)

with http_fixture_server(inner) as host:
api_client = ApiClient(Config(host=host, token='_'))
api_client = ApiClient(Config(host=host, token='_'), clock=FakeClock())
with pytest.raises(DatabricksError):
api_client.do('GET', '/foo')

Expand All @@ -520,7 +521,7 @@ def inner(h: BaseHTTPRequestHandler):
requests.append(h.requestline)

with http_fixture_server(inner) as host:
api_client = ApiClient(Config(host=host, token='_'))
api_client = ApiClient(Config(host=host, token='_'), clock=FakeClock())
res = api_client.do('GET', '/foo')
assert 'foo' in res

Expand Down
Loading