Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

TDL-16355 Implement request timeouts #43

Merged
merged 6 commits into from
Dec 20, 2021
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
18 changes: 9 additions & 9 deletions .circleci/config.yml
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@ version: 2
jobs:
build:
docker:
- image: 218546966473.dkr.ecr.us-east-1.amazonaws.com/circle-ci:tap-tester-v4
- image: 218546966473.dkr.ecr.us-east-1.amazonaws.com/circle-ci:stitch-tap-tester
steps:
- checkout
- run:
Expand All @@ -12,6 +12,7 @@ jobs:
source /usr/local/share/virtualenvs/tap-mailchimp/bin/activate
pip install -U 'pip<19.2' 'setuptools<51.0.0'
pip install .[dev]
pip install coverage
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Please use latest tap-tester image.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Updated tap-tester image

- run:
name: 'pylint'
command: |
Expand All @@ -27,20 +28,19 @@ jobs:
name: 'Unit Tests'
command: |
source /usr/local/share/virtualenvs/tap-mailchimp/bin/activate
nosetests ./tests/unittests
nosetests --with-coverage --cover-erase --cover-package=tap_mailchimp --cover-html-dir=htmlcov ./tests/unittests
coverage html
- store_test_results:
path: test_output/report.xml
- store_artifacts:
path: htmlcov
- run:
name: 'Integration Tests'
command: |
aws s3 cp s3://com-stitchdata-dev-deployment-assets/environments/tap-tester/sandbox dev_env.sh
source dev_env.sh
source /usr/local/share/virtualenvs/tap-tester/bin/activate
run-test --tap=tap-mailchimp \
--target=target-stitch \
--orchestrator=stitch-orchestrator \
--email=harrison+sandboxtest@stitchdata.com \
--password=$SANDBOX_PASSWORD \
--client-id=50 \
tests
run-test --tap=tap-mailchimp tests
workflows:
version: 2
commit:
Expand Down
1 change: 1 addition & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -30,6 +30,7 @@ Config properties:
| `dc` | See note. | "us14" | The Mailchimp data center, only requried when using API key auth. |
| `start_date` | Y | "2010-01-01T00:00:00Z" | The default start date to use for date modified replication, when available. |
| `user_agent` | N | "Vandelay Industries ETL Runner" | The user agent to send on every request. |
| `request_timeout` | N | 300 | Time for which request should wait to get response. |

## Usage

Expand Down
16 changes: 14 additions & 2 deletions tap_mailchimp/client.py
Original file line number Diff line number Diff line change
@@ -1,11 +1,12 @@
import backoff
import requests
import singer
from requests.exceptions import ConnectionError # pylint: disable=redefined-builtin
from requests.exceptions import ConnectionError, Timeout # pylint: disable=redefined-builtin
from singer import metrics

LOGGER = singer.get_logger()

REQUEST_TIMEOUT = 300
class ClientRateLimitError(Exception):
pass

Expand All @@ -21,6 +22,13 @@ def __init__(self, config):
self.__base_url = None
self.page_size = int(config.get('page_size', '1000'))

# Set request timeout to config param `request_timeout` value.
# If value is 0,"0","" or not passed then it set default to 300 seconds.
config_request_timeout = config.get('request_timeout')
if config_request_timeout and float(config_request_timeout):
self.__request_timeout = float(config_request_timeout)
else:
self.__request_timeout = REQUEST_TIMEOUT

if not self.__access_token and self.__api_key:
self.__base_url = 'https://{}.api.mailchimp.com'.format(
Expand All @@ -38,6 +46,10 @@ def get_base_url(self):
endpoint='base_url')
self.__base_url = data['api_endpoint']

@backoff.on_exception(backoff.expo,
Timeout, # Backoff for request timeout
max_tries=5,
factor=2)
@backoff.on_exception(backoff.expo,
(Server5xxError, ClientRateLimitError, ConnectionError),
max_tries=6,
Expand Down Expand Up @@ -74,7 +86,7 @@ def request(self, method, path=None, url=None, s3=False, **kwargs):

with metrics.http_request_timer(endpoint) as timer:
LOGGER.info("Executing %s request to %s with params: %s", method, url, kwargs.get('params'))
response = self.__session.request(method, url, **kwargs)
response = self.__session.request(method, url, timeout=self.__request_timeout, **kwargs) # Pass request timeout
timer.tags[metrics.Tag.http_status_code] = response.status_code

if response.status_code >= 500:
Expand Down
136 changes: 136 additions & 0 deletions tests/unittests/test_request_timeouts.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,136 @@
from tap_mailchimp.client import MailchimpClient
import unittest
from unittest.mock import patch
import requests

REQUEST_TIMEOUT_INT = 300
REQUEST_TIMEOUT_STR = "300"
REQUEST_TIMEOUT_FLOAT = 300.0

# Mock response object
def get_mock_http_response(*args, **kwargs):
contents = '{"access_token": "test", "expires_in":100, "accounts":[{"id": 12}]}'
response = requests.Response()
response.status_code = 200
response._content = contents.encode()
return response

@patch("time.sleep")
@patch("requests.Session.request", side_effect=requests.exceptions.Timeout)
class TestRequestTimeoutsBackoff(unittest.TestCase):

def test_request_timeout_backoff(self, mocked_request, mock_sleep):
"""
Verify request function is backoff for 5 times on Timeout exceeption
"""
# Initialize MailchimpClient object
client = MailchimpClient({'access_token': 'as'})
try:
client.request('GET', "http://test", "base_url")
except requests.exceptions.Timeout:
pass

# Verify that requests.Session.request is called 5 times
self.assertEqual(mocked_request.call_count, 5)

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

@prijendev the test case name and the assertion that you are making is different. Can you please verify it?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Yes, updated test case name.


@patch("requests.Session.request", side_effect=get_mock_http_response)
class TestRequestTimeoutsValue(unittest.TestCase):

def test_no_request_timeout_in_config(self, mocked_request):
"""
Verify that if request_timeout is not provided in config then default value(300) is used
"""
# Initialize MailchimpClient object
client = MailchimpClient({'access_token': 'as'})

# Call request method which call requests.Session.request with timeout
client.request('GET', "http://test", "base_url")

# Verify requests.Session.request is called with expected timeout
args, kwargs = mocked_request.call_args
self.assertEqual(kwargs.get('timeout'), REQUEST_TIMEOUT_INT) # Verify timeout argument

def test_integer_request_timeout_in_config(self, mocked_request):
"""
Verify that if request_timeout is provided in config(integer value) then it should be use
"""
# Initialize MailchimpClient object
client = MailchimpClient({'access_token': 'as', "request_timeout": REQUEST_TIMEOUT_INT}) # integer timeout in config

# Call request method which call requests.Session.request with timeout
client.request('GET', "http://test", "base_url")

# Verify requests.Session.request is called with expected timeout.
# If none zero positive integer or string value passed in the config then it converted to float value. So, here we are verifying the same.
args, kwargs = mocked_request.call_args
self.assertEqual(kwargs.get('timeout'), REQUEST_TIMEOUT_FLOAT)

def test_float_request_timeout_in_config(self, mocked_request):
"""
Verify that if request_timeout is provided in config(float value) then it should be use
"""
# Initialize MailchimpClient object
client = MailchimpClient({'access_token': 'as', "request_timeout": REQUEST_TIMEOUT_FLOAT}) # float timeout in config

# Call request method which call requests.Session.request with timeout
client.request('GET', "http://test", "base_url")

# Verify requests.Session.request is called with expected timeout
args, kwargs = mocked_request.call_args
self.assertEqual(kwargs.get('timeout'), REQUEST_TIMEOUT_FLOAT) # Verify timeout argument

def test_string_request_timeout_in_config(self, mocked_request):
"""
Verify that if request_timeout is provided in config(string value) then it should be use
"""
# Initialize MailchimpClient object
client = MailchimpClient({'access_token': 'as', "request_timeout": REQUEST_TIMEOUT_STR}) # string timeout in config

# Call request method which call requests.Session.request with timeout
client.request('GET', "http://test", "base_url")

# Verify requests.Session.request is called with expected timeout
# If none zero positive integer or string value passed in the config then it converted to float value. So, here we are verifying the same.
args, kwargs = mocked_request.call_args
self.assertEqual(kwargs.get('timeout'), REQUEST_TIMEOUT_FLOAT) # Verify timeout argument

def test_empty_string_request_timeout_in_config(self, mocked_request):
"""
Verify that if request_timeout is provided in config with empty string then default value(300) is used
"""
# Initialize MailchimpClient object
client = MailchimpClient({'access_token': 'as', "request_timeout": ""}) # empty string timeout in config

# Call request method which call requests.Session.request with timeout
client.request('GET', "http://test", "base_url")

# Verify requests.Session.request is called with expected timeout
args, kwargs = mocked_request.call_args
self.assertEqual(kwargs.get('timeout'), REQUEST_TIMEOUT_INT) # Verify timeout argument

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

@prijendev Why int value is expected in this test case?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

If the request_timeout value is not passed in the config then the default value that is int value(300) is used.


def test_zero_int_request_timeout_in_config(self, mocked_request):
"""
Verify that if request_timeout is provided in config with int zero value then default value(300) is used
"""
# Initialize MailchimpClient object
client = MailchimpClient({'access_token': 'as', "request_timeout": 0}) # int zero value in config

# Call request method which call requests.Session.request with timeout
client.request('GET', "http://test", "base_url")

# Verify requests.Session.request is called with expected timeout
args, kwargs = mocked_request.call_args
self.assertEqual(kwargs.get('timeout'), REQUEST_TIMEOUT_INT) # Verify timeout argument

def test_zero_string_request_timeout_in_config(self, mocked_request):
"""
Verify that if request_timeout is provided in config with string zero in string format then default value(300) is used
"""
client = MailchimpClient({'access_token': 'as', "request_timeout": "0"}) # string zero value in config

# Call request method which call requests.Session.request with timeout
client.request('GET', "http://test", "base_url")

# Verify requests.Session.request is called with expected timeout
args, kwargs = mocked_request.call_args
self.assertEqual(kwargs.get('timeout'), REQUEST_TIMEOUT_INT) # Verify timeout argument