Skip to content

Commit 02a803f

Browse files
authored
implement our own retry logic & logging for event posts, don't use urllib3.Retry (#133)
1 parent f7ec18a commit 02a803f

File tree

2 files changed

+79
-39
lines changed

2 files changed

+79
-39
lines changed

ldclient/event_processor.py

+63-36
Original file line numberDiff line numberDiff line change
@@ -28,9 +28,8 @@
2828
from ldclient.interfaces import EventProcessor
2929
from ldclient.repeating_timer import RepeatingTimer
3030
from ldclient.util import UnsuccessfulResponseException
31-
from ldclient.util import _headers, _retryable_statuses
3231
from ldclient.util import log
33-
from ldclient.util import http_error_message, is_http_error_recoverable, stringify_attrs, throw_if_unsuccessful_response
32+
from ldclient.util import check_if_error_is_recoverable_and_log, is_http_error_recoverable, stringify_attrs, throw_if_unsuccessful_response, _headers
3433
from ldclient.diagnostics import create_diagnostic_init
3534

3635
__MAX_FLUSH_THREADS__ = 5
@@ -141,18 +140,6 @@ def _get_userkey(self, event):
141140
return str(event['user'].get('key'))
142141

143142

144-
class _EventRetry(urllib3.Retry):
145-
def __init__(self):
146-
urllib3.Retry.__init__(self, total=1,
147-
method_whitelist=False, # Enable retry on POST
148-
status_forcelist=_retryable_statuses,
149-
raise_on_status=False)
150-
151-
# Override backoff time to be flat 1 second
152-
def get_backoff_time(self):
153-
return 1
154-
155-
156143
class EventPayloadSendTask(object):
157144
def __init__(self, http, config, formatter, payload, response_fn):
158145
self._http = http
@@ -175,16 +162,17 @@ def _do_send(self, output_events):
175162
try:
176163
json_body = json.dumps(output_events)
177164
log.debug('Sending events payload: ' + json_body)
178-
hdrs = _headers(self._config)
179-
hdrs['X-LaunchDarkly-Event-Schema'] = str(__CURRENT_EVENT_SCHEMA__)
180-
hdrs['X-LaunchDarkly-Payload-ID'] = str(uuid.uuid4())
181-
uri = self._config.events_uri
182-
r = self._http.request('POST', uri,
183-
headers=hdrs,
184-
timeout=urllib3.Timeout(connect=self._config.connect_timeout, read=self._config.read_timeout),
185-
body=json_body,
186-
retries=_EventRetry())
187-
self._response_fn(r)
165+
payload_id = str(uuid.uuid4())
166+
r = _post_events_with_retry(
167+
self._http,
168+
self._config,
169+
self._config.events_uri,
170+
payload_id,
171+
json_body,
172+
"%d events" % len(self._payload.events)
173+
)
174+
if r:
175+
self._response_fn(r)
188176
return r
189177
except Exception as e:
190178
log.warning(
@@ -202,13 +190,14 @@ def run(self):
202190
try:
203191
json_body = json.dumps(self._event_body)
204192
log.debug('Sending diagnostic event: ' + json_body)
205-
hdrs = _headers(self._config)
206-
uri = self._config.events_base_uri + '/diagnostic'
207-
r = self._http.request('POST', uri,
208-
headers=hdrs,
209-
timeout=urllib3.Timeout(connect=self._config.connect_timeout, read=self._config.read_timeout),
210-
body=json_body,
211-
retries=1)
193+
_post_events_with_retry(
194+
self._http,
195+
self._config,
196+
self._config.events_base_uri + '/diagnostic',
197+
None,
198+
json_body,
199+
"diagnostic event"
200+
)
212201
except Exception as e:
213202
log.warning(
214203
'Unhandled exception in event processor. Diagnostic event was not sent. [%s]', e)
@@ -381,11 +370,9 @@ def _handle_response(self, r):
381370
if server_date is not None:
382371
timestamp = int(time.mktime(server_date) * 1000)
383372
self._last_known_past_time = timestamp
384-
if r.status > 299:
385-
log.error(http_error_message(r.status, "event delivery", "some events were dropped"))
386-
if not is_http_error_recoverable(r.status):
387-
self._disabled = True
388-
return
373+
if r.status > 299 and not is_http_error_recoverable(r.status):
374+
self._disabled = True
375+
return
389376

390377
def _send_and_reset_diagnostics(self):
391378
if self._diagnostic_accumulator is not None:
@@ -472,3 +459,43 @@ def __enter__(self):
472459

473460
def __exit__(self, type, value, traceback):
474461
self.stop()
462+
463+
464+
def _post_events_with_retry(
465+
http_client,
466+
config,
467+
uri,
468+
payload_id,
469+
body,
470+
events_description
471+
):
472+
hdrs = _headers(config)
473+
hdrs['Content-Type'] = 'application/json'
474+
if payload_id:
475+
hdrs['X-LaunchDarkly-Event-Schema'] = str(__CURRENT_EVENT_SCHEMA__)
476+
hdrs['X-LaunchDarkly-Payload-ID'] = payload_id
477+
can_retry = True
478+
context = "posting %s" % events_description
479+
while True:
480+
next_action_message = "will retry" if can_retry else "some events were dropped"
481+
try:
482+
r = http_client.request(
483+
'POST',
484+
uri,
485+
headers=hdrs,
486+
body=body,
487+
timeout=urllib3.Timeout(connect=config.connect_timeout, read=config.read_timeout),
488+
retries=0
489+
)
490+
if r.status < 300:
491+
return r
492+
recoverable = check_if_error_is_recoverable_and_log(context, r.status, None, next_action_message)
493+
if not recoverable:
494+
return r
495+
except Exception as e:
496+
check_if_error_is_recoverable_and_log(context, None, str(e), next_action_message)
497+
if not can_retry:
498+
return None
499+
can_retry = False
500+
# fixed delay of 1 second for event retries
501+
time.sleep(1)

ldclient/util.py

+16-3
Original file line numberDiff line numberDiff line change
@@ -89,15 +89,28 @@ def is_http_error_recoverable(status):
8989
return True # all other errors are recoverable
9090

9191

92+
def http_error_description(status):
93+
return "HTTP error %d%s" % (status, " (invalid SDK key)" if (status == 401 or status == 403) else "")
94+
95+
9296
def http_error_message(status, context, retryable_message = "will retry"):
93-
return "Received HTTP error %d%s for %s - %s" % (
94-
status,
95-
" (invalid SDK key)" if (status == 401 or status == 403) else "",
97+
return "Received %s for %s - %s" % (
98+
http_error_description(status),
9699
context,
97100
retryable_message if is_http_error_recoverable(status) else "giving up permanently"
98101
)
99102

100103

104+
def check_if_error_is_recoverable_and_log(error_context, status_code, error_desc, recoverable_message):
105+
if status_code and (error_desc is None):
106+
error_desc = http_error_description(status_code)
107+
if status_code and not is_http_error_recoverable(status_code):
108+
log.error("Error %s (giving up permanently): %s" % (error_context, error_desc))
109+
return False
110+
log.warning("Error %s (%s): %s" % (error_context, recoverable_message, error_desc))
111+
return True
112+
113+
101114
def stringify_attrs(attrdict, attrs):
102115
if attrdict is None:
103116
return None

0 commit comments

Comments
 (0)