2017-02-21 16:27:49 -08:00
|
|
|
'''
|
2017-02-28 16:23:59 -08:00
|
|
|
doublethink/rethinker.py - rethinkdb connection-manager
|
2017-02-21 16:27:49 -08:00
|
|
|
|
2023-05-18 17:16:04 -07:00
|
|
|
Copyright (C) 2015-2023 Internet Archive
|
2017-02-21 16:27:49 -08:00
|
|
|
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
you may not use this file except in compliance with the License.
|
|
|
|
You may obtain a copy of the License at
|
|
|
|
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
See the License for the specific language governing permissions and
|
|
|
|
limitations under the License.
|
|
|
|
'''
|
|
|
|
|
2023-05-18 17:16:04 -07:00
|
|
|
import rethinkdb as rdb
|
2017-02-21 16:27:49 -08:00
|
|
|
import logging
|
|
|
|
import random
|
|
|
|
import time
|
|
|
|
import types
|
2017-05-01 14:01:01 -07:00
|
|
|
import re
|
2017-02-21 16:27:49 -08:00
|
|
|
|
2023-05-18 17:16:04 -07:00
|
|
|
# Module-level rethinkdb driver handle. The classes in this module use it to
# open connections (r.connect), to reference driver exception types
# (r.ReqlTimeoutError, r.ReqlOpFailedError) and, via Rethinker.__getattr__,
# as the root object that query-building attribute lookups are delegated to.
r = rdb.RethinkDB()
|
|
|
|
|
2017-02-21 16:27:49 -08:00
|
|
|
class RethinkerWrapper(object):
    '''
    Proxy around an object produced while building a rethinkdb query.

    Attribute and item lookups are forwarded to the wrapped object and the
    result is passed through `rr.wrap()`. `run()` executes the wrapped query
    on a connection obtained from `rr._random_server_connection()` and makes
    sure that connection is closed again.
    '''
    logger = logging.getLogger('doublethink.RethinkerWrapper')

    def __init__(self, rr, wrapped):
        '''
        Args:
            rr: owner object; must provide `wrap()`, `dbname` and
                `_random_server_connection()`
            wrapped: the object attribute/item access is delegated to
        '''
        self.rr = rr
        self.wrapped = wrapped

    def __getattr__(self, name):
        '''
        Delegates lookup of `name` to the wrapped object, returning the
        result passed through `rr.wrap()`.

        Raises:
            AttributeError: if the wrapped object has no such attribute, or
                if this instance has not been initialized yet
        '''
        # __getattr__ only runs when normal lookup has failed, so being asked
        # for one of our own instance attributes means __init__ never ran
        # (e.g. copy/pickle probing a freshly created bare instance).
        # Touching self.wrapped here would re-enter __getattr__ forever.
        if name in ('rr', 'wrapped'):
            raise AttributeError(name)
        delegate = getattr(self.wrapped, name)
        return self.rr.wrap(delegate)

    def __getitem__(self, key):
        '''Delegates `self[key]` to the wrapped object, via `rr.wrap()`.'''
        return self.rr.wrap(self.wrapped.__getitem__)(key)

    def __repr__(self):
        return '<RethinkerWrapper{}>'.format(repr(self.wrapped))

    @staticmethod
    def _is_recoverable(e):
        '''
        Returns True if exception `e` carries a message starting with
        "Cannot perform" and mentioning "replica", the condition this class
        treats as worth retrying.
        '''
        return bool(
                e.args and re.match(
                    '^Cannot perform.*replica.*', e.args[0]))

    def _result_iter(self, conn, result):
        '''
        Generator yielding the items of `result`, closing `result` and
        `conn` when it finishes, fails or is closed.

        The first value yielded is a meaningless placeholder; `run()`
        consumes it so that the generator is already inside the `try` block
        by the time the caller receives it.

        A recoverable `r.ReqlOpFailedError` raised while fetching an item is
        retried after a 0.5 second sleep, at most 20 times over the life of
        the generator; any other failure propagates.

        Args:
            conn: connection the query is running on
            result: iterator returned by the query
        '''
        error_count = 0
        try:
            yield  # empty yield, see comment in run()
            while True:
                try:
                    yield next(result)
                except StopIteration:
                    break
                except r.ReqlOpFailedError as e:
                    if not self._is_recoverable(e) or error_count >= 20:
                        raise
                    error_count += 1
                    self.logger.warning(
                            'will keep trying after potentially '
                            'recoverable error (%s/20): %s',
                            error_count, e)
                    time.sleep(0.5)
        finally:
            # Close the connection even if closing the cursor fails,
            # otherwise the connection would be leaked.
            try:
                result.close()
            finally:
                conn.close()

    def run(self, db=None, **kwargs):
        '''
        Runs the wrapped query, retrying until it succeeds or fails with an
        error that is not considered recoverable.

        Each attempt uses a fresh connection from
        `rr._random_server_connection()`. `r.ReqlTimeoutError` and
        recoverable `r.ReqlOpFailedError` cause a 0.5 second sleep followed
        by another attempt, with no upper bound on the number of attempts.

        Args:
            db: database name passed to the query; `rr.dbname` is used when
                this is falsy
            **kwargs: passed through to the wrapped object's `run()`

        Returns:
            The query result. If the result is an iterator (has `__next__`),
            a generator over its items is returned instead, and the
            connection stays open until that generator is exhausted or
            closed.

        Raises:
            AttributeError: if the wrapped object has no `run` attribute
        '''
        self.wrapped.run  # raise AttributeError early
        while True:
            conn = self.rr._random_server_connection()
            is_iter = False
            try:
                result = self.wrapped.run(
                        conn, db=db or self.rr.dbname, **kwargs)
                if hasattr(result, '__next__'):
                    is_iter = True
                    g = self._result_iter(conn, result)
                    # Start executing the generator, leaving off after the
                    # empty yield. If we didn't do this, and the caller never
                    # started the generator, the finally block would never run
                    # and the connection would stay open.
                    next(g)
                    return g
                else:
                    return result
            except r.ReqlTimeoutError:
                time.sleep(0.5)
            except r.ReqlOpFailedError as e:
                if self._is_recoverable(e):
                    self.logger.warning(
                            'will keep trying after potentially recoverable '
                            'error: %s', e)
                    time.sleep(0.5)
                else:
                    raise
            finally:
                # When a generator was handed out, it owns the connection and
                # closes it itself; otherwise we are done with it here.
                if not is_iter:
                    conn.close(noreply_wait=False)
|
|
|
|
|
|
|
|
class Rethinker(object):
    '''
    Entry point for building and running rethinkdb queries against one of a
    list of servers, opening a new connection for each query.

    Attributes not defined here are looked up on the module-level rethinkdb
    handle `r` and wrapped, so query-building calls can be chained and then
    executed with `run()`.

    >>> rr = Rethinker(db='my_db')
    >>> doc = rr.table('my_table').get(1).run()
    '''
    logger = logging.getLogger('doublethink.Rethinker')

    # https://en.wikipedia.org/wiki/Penalty_(ice_hockey)#Major_penalty
    # Number of seconds a server is avoided after a failed connection attempt.
    PENALTY_BOX_TIME = 300

    def __init__(self, servers=None, db=None):
        '''
        Args:
            servers: a single "host" or "host:port" string, or a sequence of
                such strings; defaults to `['localhost']`
            db: default database name used by queries that do not specify one
        '''
        if servers is None:
            # Build the default per instance; a list literal in the signature
            # would be shared (and mutable) across all instances.
            self.servers = ['localhost']
        elif isinstance(servers, str):
            self.servers = [servers]
        else:
            self.servers = servers
        self.dbname = db
        self.last_error = {}  # {server: time}

    # https://github.com/rethinkdb/rethinkdb-example-webpy-blog/blob/master/model.py
    # "Best practices: Managing connections: a connection per request"
    def _random_server_connection(self):
        '''
        Returns a new connection to a randomly chosen server from
        `_server_whitelist()`.

        Keeps trying until a connection succeeds. After each failure the
        time of the failure is recorded in `self.last_error` for that server
        and the method sleeps, starting at 0.01 seconds and doubling each
        time up to a maximum of 10 seconds.
        '''
        retry_wait = 0.01
        while True:
            server = random.choice(self._server_whitelist())
            try:
                try:
                    host, port = server.split(':')
                    return r.connect(host=host, port=port)
                except ValueError:
                    # not exactly "host:port"; use the whole string as host
                    return r.connect(host=server)
            except Exception as e:
                self.last_error[server] = time.time()
                self.logger.warning(
                        'will keep trying after failure connecting to '
                        'rethinkdb server at %s: %s (sleeping for %s sec)',
                        server, e, retry_wait)
                time.sleep(retry_wait)
                retry_wait = min(retry_wait * 2, 10.0)

    def _server_whitelist(self):
        '''
        Returns list of servers that have not errored in the last
        `PENALTY_BOX_TIME` seconds (five minutes).

        If all servers have errored in that period, returns list with one
        item, the server from `self.servers` that errored least recently.
        Returns an empty list if `self.servers` is empty.
        '''
        cutoff = time.time() - self.PENALTY_BOX_TIME
        whitelist = []
        for server in self.servers:
            errored_at = self.last_error.get(server)
            if errored_at is None or errored_at < cutoff:
                whitelist.append(server)
        if not whitelist and self.servers:
            # Every configured server has an entry in last_error at this
            # point. Choose among the configured servers only, so that a
            # stale entry for a server no longer in the list is never
            # returned.
            whitelist.append(
                    min(self.servers, key=lambda s: self.last_error[s]))
        return whitelist

    def wrap(self, delegate):
        '''
        Prepares `delegate` for use in a chained query expression.

        If `delegate` is a python function or method, returns a function
        that calls it and wraps any non-None return value in a
        `RethinkerWrapper`; a None return value is passed through as None.
        Anything else is returned unchanged.
        '''
        if not isinstance(delegate, (types.FunctionType, types.MethodType)):
            return delegate

        def wrapper(*args, **kwargs):
            result = delegate(*args, **kwargs)
            if result is None:
                return None
            return RethinkerWrapper(self, result)
        return wrapper

    def __getattr__(self, name):
        '''
        Looks up `name` on the module-level rethinkdb handle `r` and returns
        it passed through `wrap()`.
        '''
        delegate = getattr(r, name)
        return self.wrap(delegate)
|
|
|
|
|