mirror of
https://github.com/moparisthebest/SickRage
synced 2025-01-07 11:58:01 -05:00
Replaced the cache handler with a modified version of our own, which gives quicker Indexer API responses to our requests
This commit is contained in:
parent
ff1e6e6dbc
commit
6a1ccef8d9
13
lib/cachecontrol/__init__.py
Normal file
13
lib/cachecontrol/__init__.py
Normal file
@ -0,0 +1,13 @@
|
|||||||
|
"""CacheControl import Interface.
|
||||||
|
|
||||||
|
Make it easy to import from cachecontrol without long namespaces.
|
||||||
|
"""
|
||||||
|
|
||||||
|
# patch our requests.models.Response to make them pickleable in older
|
||||||
|
# versions of requests.
|
||||||
|
|
||||||
|
import cachecontrol.patch_requests
|
||||||
|
|
||||||
|
from cachecontrol.wrapper import CacheControl
|
||||||
|
from cachecontrol.adapter import CacheControlAdapter
|
||||||
|
from cachecontrol.controller import CacheController
|
75
lib/cachecontrol/adapter.py
Normal file
75
lib/cachecontrol/adapter.py
Normal file
@ -0,0 +1,75 @@
|
|||||||
|
from requests.adapters import HTTPAdapter
|
||||||
|
|
||||||
|
from cachecontrol.controller import CacheController
|
||||||
|
from cachecontrol.cache import DictCache
|
||||||
|
|
||||||
|
|
||||||
|
class CacheControlAdapter(HTTPAdapter):
    """Transport adapter that consults a cache before using the network.

    GET requests are answered from the cache when the controller returns a
    stored response for them. Successful PUT and DELETE requests evict the
    cached entry for their URL.
    """

    invalidating_methods = set(['PUT', 'DELETE'])

    def __init__(self, cache=None, cache_etags=True, cache_all=False, *args, **kw):
        """Create the adapter.

        :param cache: object exposing ``get``/``set``/``delete``; a
            ``DictCache`` is created when omitted.
        :param cache_etags: forwarded to ``CacheController``.
        :param cache_all: forwarded to ``CacheController``.
        """
        super(CacheControlAdapter, self).__init__(*args, **kw)
        # Compare against None so a valid cache object that happens to be
        # falsy (e.g. an empty container-like cache) is not thrown away.
        self.cache = DictCache() if cache is None else cache
        self.controller = CacheController(self.cache, cache_etags=cache_etags, cache_all=cache_all)

    def send(self, request, **kw):
        """Send a request, answering GETs from the cache when possible."""
        if request.method == 'GET':
            cached_response = self.controller.cached_request(
                request.url, request.headers
            )
            if cached_response:
                # Cached responses should not have a raw field since
                # they *cannot* be created from some stream.
                cached_response.raw = None
                return cached_response

            # Check for etags and add validators if appropriate. This is
            # only done for GET: an ``If-None-Match`` on a PUT or DELETE
            # would turn it into a conditional write.
            headers = self.controller.add_headers(request.url)
            request.headers.update(headers)

        return super(CacheControlAdapter, self).send(request, **kw)

    def build_response(self, request, response):
        """Build the ``requests`` response and keep the cache in sync.

        :param request: the prepared request that was sent.
        :param response: the low-level response handed over by the parent
            adapter (its ``status`` attribute is inspected for 304).
        :returns: a response object carrying a ``from_cache`` attribute.
        """
        resp = super(CacheControlAdapter, self).build_response(
            request, response
        )

        # See if we should invalidate the cache.
        if request.method in self.invalidating_methods and resp.ok:
            cache_url = self.controller.cache_url(request.url)
            self.cache.delete(cache_url)

        # Try to store the response if it is a GET
        elif request.method == 'GET':
            if response.status == 304:
                # We must have sent a conditional request; refresh the
                # cached entry with the headers of this 304.
                cached = self.controller.update_cached_response(
                    request, response
                )
                # The controller hands the low-level response straight back
                # when it has no cached entry. In that case keep the
                # response we just built instead of leaking the raw object
                # to the caller.
                if cached is not None and cached is not response:
                    resp = cached
                    # Fix possible exception when using missing `raw` field
                    # in requests.
                    # TODO: remove when requests is bumped to 2.2.2 or 2.3
                    resp.raw = None
            else:
                # try to cache the response
                self.controller.cache_response(request, resp)

        # Give the response a from_cache attr to let people use it
        # rather than testing for hasattr.
        if not hasattr(resp, 'from_cache'):
            resp.from_cache = False

        return resp
|
36
lib/cachecontrol/cache.py
Normal file
36
lib/cachecontrol/cache.py
Normal file
@ -0,0 +1,36 @@
|
|||||||
|
"""
|
||||||
|
The cache object API for implementing caches. The default is just a
|
||||||
|
dictionary, which in turn means it is not threadsafe for writing.
|
||||||
|
"""
|
||||||
|
from threading import Lock
|
||||||
|
|
||||||
|
|
||||||
|
class BaseCache(object):
    """Interface every cache backend implements.

    Subclasses override ``get``, ``set`` and ``delete``; the base versions
    only signal that the method has not been provided.
    """

    def get(self, key):
        """Return the value stored under *key*."""
        # NotImplemented is a comparison sentinel, not an exception, and
        # calling it raises TypeError; NotImplementedError is the intended
        # signal.
        raise NotImplementedError()

    def set(self, key, value):
        """Store *value* under *key*."""
        raise NotImplementedError()

    def delete(self, key):
        """Remove *key* from the cache."""
        raise NotImplementedError()
|
||||||
|
|
||||||
|
|
||||||
|
class DictCache(BaseCache):
    """In-memory cache backed by a plain dictionary.

    Writes and deletes are serialised with a lock; reads are not locked.
    """

    def __init__(self, init_dict=None):
        """Create the cache.

        :param init_dict: optional dictionary to use as the backing store.
            It is used as-is (not copied), including when it is empty.
        """
        self.lock = Lock()
        # ``init_dict or {}`` would replace a caller-supplied empty dict
        # with a private one, silently breaking sharing.
        self.data = {} if init_dict is None else init_dict

    def get(self, key):
        """Return the value stored under *key*, or ``None`` if absent."""
        return self.data.get(key, None)

    def set(self, key, value):
        """Store *value* under *key*."""
        with self.lock:
            self.data[key] = value

    def delete(self, key):
        """Remove *key*; a missing key is ignored."""
        with self.lock:
            self.data.pop(key, None)
|
18
lib/cachecontrol/caches/__init__.py
Normal file
18
lib/cachecontrol/caches/__init__.py
Normal file
@ -0,0 +1,18 @@
|
|||||||
|
from textwrap import dedent
|
||||||
|
|
||||||
|
try:
|
||||||
|
from cachecontrol.caches.file_cache import FileCache
|
||||||
|
except ImportError:
|
||||||
|
notice = dedent('''
|
||||||
|
NOTE: In order to use the FileCache you must have
|
||||||
|
lockfile installed. You can install it via pip:
|
||||||
|
pip install lockfile
|
||||||
|
''')
|
||||||
|
print(notice)
|
||||||
|
|
||||||
|
|
||||||
|
try:
|
||||||
|
import redis
|
||||||
|
from cachecontrol.caches.redis_cache import RedisCache
|
||||||
|
except ImportError:
|
||||||
|
pass
|
51
lib/cachecontrol/caches/file_cache.py
Normal file
51
lib/cachecontrol/caches/file_cache.py
Normal file
@ -0,0 +1,51 @@
|
|||||||
|
import os
|
||||||
|
import sys
|
||||||
|
from hashlib import md5
|
||||||
|
|
||||||
|
try:
|
||||||
|
from pickle import load, dump, HIGHEST_PROTOCOL
|
||||||
|
except ImportError:
|
||||||
|
from cPickle import load, dump, HIGHEST_PROTOCOL
|
||||||
|
|
||||||
|
from lockfile import FileLock
|
||||||
|
|
||||||
|
|
||||||
|
class FileCache(object):
    """Cache backend that pickles every entry into its own file.

    File names are the MD5 hex digest of the cache key, placed inside
    ``directory``.
    """

    def __init__(self, directory, forever=False):
        """Create the cache, creating *directory* if necessary.

        :param directory: folder that holds the cache files.
        :param forever: when true, ``delete`` never removes files.
        """
        self.directory = directory
        self.forever = forever

        if not os.path.isdir(self.directory):
            try:
                # makedirs also creates missing parent directories.
                os.makedirs(self.directory)
            except OSError:
                # Something else may have created it between the check and
                # the call; only fail if it still does not exist.
                if not os.path.isdir(self.directory):
                    raise

    @staticmethod
    def encode(x):
        """Return the MD5 hex digest of the text *x*."""
        return md5(x.encode()).hexdigest()

    def _fn(self, name):
        """Return the path of the cache file used for key *name*."""
        return os.path.join(self.directory, self.encode(name))

    def get(self, key):
        """Return the unpickled value for *key*, or ``None``.

        ``None`` is returned when no file exists for the key or when the
        file cannot be unpickled (``ValueError``) or is empty/truncated
        (``EOFError``).
        """
        name = self._fn(key)
        if not os.path.exists(name):
            return None

        # NOTE(review): pickle executes code embedded in the data; the
        # cache directory must not be writable by untrusted parties.
        with open(name, 'rb') as fh:
            try:
                # Compare the numeric major version; comparing the version
                # *string* with '3' breaks for e.g. a "10.x" interpreter.
                if sys.version_info[0] < 3:
                    return load(fh)
                return load(fh, encoding='latin1')
            except (ValueError, EOFError):
                return None

    def set(self, key, value):
        """Pickle *value* into the file for *key* while holding a file lock."""
        name = self._fn(key)
        with FileLock(name) as lock:
            with open(lock.path, 'wb') as fh:
                dump(value, fh, HIGHEST_PROTOCOL)

    def delete(self, key):
        """Remove the file for *key* unless the cache is ``forever``.

        A missing file is ignored, matching ``DictCache.delete``; callers
        invalidate URLs without first checking that they are cached.
        """
        import errno

        name = self._fn(key)
        if not self.forever:
            try:
                os.remove(name)
            except OSError as exc:
                if exc.errno != errno.ENOENT:
                    raise
|
46
lib/cachecontrol/caches/redis_cache.py
Normal file
46
lib/cachecontrol/caches/redis_cache.py
Normal file
@ -0,0 +1,46 @@
|
|||||||
|
from __future__ import division
|
||||||
|
|
||||||
|
from datetime import datetime
|
||||||
|
|
||||||
|
try:
|
||||||
|
from cPickle import loads, dumps
|
||||||
|
except ImportError: # Python 3.x
|
||||||
|
from pickle import loads, dumps
|
||||||
|
|
||||||
|
|
||||||
|
def total_seconds(td):
    """Return the length of the timedelta-like *td* in seconds.

    Uses ``td.total_seconds()`` when the object provides it; otherwise
    (Python 2.6 compatibility) the value is derived from the ``days``,
    ``seconds`` and ``microseconds`` attributes.
    """
    if not hasattr(td, 'total_seconds'):
        micro = td.microseconds
        whole = (td.days * 24 * 3600 + td.seconds)
        return (whole * 10**6 + micro) / 10**6

    return td.total_seconds()
|
||||||
|
|
||||||
|
|
||||||
|
class RedisCache(object):
    """Cache backend that stores pickled values through a Redis connection."""

    def __init__(self, conn):
        """:param conn: connection object exposing ``get``, ``set``,
        ``setex``, ``delete`` and ``keys``."""
        self.conn = conn

    def get(self, key):
        """Return the unpickled value for *key*, or ``None`` if absent."""
        val = self.conn.get(key)
        if val:
            # NOTE(review): pickle executes code embedded in the data; only
            # use this with a Redis instance you trust.
            return loads(val)
        return None

    def set(self, key, value, expires=None):
        """Store *value* under *key*.

        :param expires: optional ``datetime`` at which the entry should
            expire, compared against ``datetime.now()``.
        """
        if not expires:
            self.conn.set(key, dumps(value))
            return

        # Redis expects a whole, positive number of seconds.
        ttl = int(total_seconds(expires - datetime.now()))
        if ttl <= 0:
            # Already expired: make sure no stale value stays behind.
            self.conn.delete(key)
            return

        # The value must be pickled exactly like the non-expiring branch,
        # otherwise ``get`` cannot unpickle it again.
        # NOTE(review): argument order is (name, time, value); confirm it
        # matches the client class in use.
        self.conn.setex(key, ttl, dumps(value))

    def delete(self, key):
        """Remove *key* from Redis."""
        self.conn.delete(key)

    def clear(self):
        """Helper for clearing all the keys in a database. Use with
        caution!"""
        for key in self.conn.keys():
            self.conn.delete(key)
|
12
lib/cachecontrol/compat.py
Normal file
12
lib/cachecontrol/compat.py
Normal file
@ -0,0 +1,12 @@
|
|||||||
|
try:
|
||||||
|
from urllib.parse import urljoin
|
||||||
|
except ImportError:
|
||||||
|
from urlparse import urljoin
|
||||||
|
|
||||||
|
|
||||||
|
try:
|
||||||
|
import email.utils
|
||||||
|
parsedate_tz = email.utils.parsedate_tz
|
||||||
|
except ImportError:
|
||||||
|
import email.Utils
|
||||||
|
parsedate_tz = email.Utils.parsedate_tz
|
258
lib/cachecontrol/controller.py
Normal file
258
lib/cachecontrol/controller.py
Normal file
@ -0,0 +1,258 @@
|
|||||||
|
"""
|
||||||
|
The httplib2 algorithms ported for use with requests.
|
||||||
|
"""
|
||||||
|
import re
|
||||||
|
import calendar
|
||||||
|
import time
|
||||||
|
import datetime
|
||||||
|
|
||||||
|
from cachecontrol.cache import DictCache
|
||||||
|
from cachecontrol.compat import parsedate_tz
|
||||||
|
|
||||||
|
|
||||||
|
# Generic URI splitter; capture groups 2, 4, 5, 7 and 9 hold the scheme,
# authority, path, query and fragment respectively.
URI = re.compile(r"^(([^:/?#]+):)?(//([^/?#]*))?([^?#]*)(\?([^#]*))?(#(.*))?")


def parse_uri(uri):
    """Split *uri* with the regular expression from RFC 3986, Appendix B.

    Returns the tuple ``(scheme, authority, path, query, fragment)``;
    components that are absent from *uri* are ``None`` (the path is an
    empty string instead).
    """
    matched = URI.match(uri)
    scheme, authority, path, query, fragment = matched.group(2, 4, 5, 7, 9)
    return (scheme, authority, path, query, fragment)
|
||||||
|
|
||||||
|
|
||||||
|
class CacheController(object):
    """Decide whether a request may be answered from, or stored in, the cache."""

    def __init__(self, cache=None, cache_etags=True, cache_all=False):
        """Create the controller.

        :param cache: object exposing ``get``/``set``/``delete``; a
            ``DictCache`` is created when omitted.
        :param cache_etags: store responses that carry an ``etag`` header.
        :param cache_all: store every 200/203 GET response, adding
            cache headers to it first.
        """
        self.cache = DictCache() if cache is None else cache
        self.cache_etags = cache_etags
        self.cache_all = cache_all

    @staticmethod
    def _to_int(value, default=0):
        """Return ``int(value)``, or *default* when it cannot be converted."""
        try:
            return int(value)
        except (TypeError, ValueError):
            return default

    def _urlnorm(self, uri):
        """Normalize the URL to create a safe key for the cache.

        The scheme and authority are lower-cased, an empty path becomes
        ``/`` and the fragment is dropped.

        :raises Exception: if *uri* has no scheme or no authority.
        """
        (scheme, authority, path, query, fragment) = parse_uri(uri)
        if not scheme or not authority:
            raise Exception("Only absolute URIs are allowed. uri = %s" % uri)
        authority = authority.lower()
        scheme = scheme.lower()
        if not path:
            path = "/"

        # Could do syntax based normalization of the URI before
        # computing the digest. See Section 6.2.2 of Std 66.
        request_uri = "?".join([path, query]) if query else path
        return scheme + "://" + authority + request_uri

    def cache_url(self, uri):
        """Return the cache key used for *uri*."""
        return self._urlnorm(uri)

    def parse_cache_control(self, headers):
        """
        Parse the cache control headers returning a dictionary with values
        for the different directives.

        Directive names and values are lower-cased and stripped. A
        directive with a value maps to that value as a string; a directive
        without one maps to the integer ``1``.
        """
        retval = {}

        cc_header = 'cache-control'
        if 'Cache-Control' in headers:
            cc_header = 'Cache-Control'

        if cc_header in headers:
            parts = headers[cc_header].split(',')
            parts_with_args = [
                tuple([x.strip().lower() for x in part.split("=", 1)])
                for part in parts if "=" in part]
            parts_wo_args = [(name.strip().lower(), 1)
                             for name in parts if "=" not in name]
            retval = dict(parts_with_args + parts_wo_args)
        return retval

    def _is_fresh(self, resp, cc):
        """Return True when cached *resp* is still fresh for a request.

        :param resp: the cached response; its ``headers`` are read.
        :param cc: parsed Cache-Control directives of the request.
        """
        # Without a usable Date header the age cannot be computed, so the
        # entry is treated as stale instead of raising.
        date_header = resp.headers.get('date')
        date_tuple = parsedate_tz(date_header) if date_header else None
        if date_tuple is None:
            return False

        date = calendar.timegm(date_tuple)
        current_age = max(0, time.time() - date)

        # TODO: There is an assumption that the result will be a
        # requests response object. This may not be best since we
        # could probably avoid instantiating or constructing the
        # response until we know we need it.
        resp_cc = self.parse_cache_control(resp.headers)

        # determine freshness
        freshness_lifetime = 0
        max_age = resp_cc.get('max-age')
        # A valueless ``max-age`` directive parses to the int 1, which has
        # no ``isdigit``; treat it like any other invalid value.
        if hasattr(max_age, 'isdigit') and max_age.isdigit():
            freshness_lifetime = int(max_age)
        elif 'expires' in resp.headers:
            expires_header = resp.headers['expires']
            expires = parsedate_tz(expires_header) if expires_header else None
            if expires is not None:
                expire_time = calendar.timegm(expires) - date
                freshness_lifetime = max(0, expire_time)

        # determine if we are setting freshness limit in the req
        if 'max-age' in cc:
            freshness_lifetime = self._to_int(cc['max-age'], 0)

        if 'min-fresh' in cc:
            # adjust our current age by our min fresh
            current_age += self._to_int(cc['min-fresh'], 0)

        # see how fresh we actually are
        return freshness_lifetime > current_age

    def cached_request(self, url, headers):
        """Return the cached response for *url* if it may be used.

        :param url: URL of the outgoing GET request.
        :param headers: mutable request headers; validators
            (``If-None-Match`` / ``If-Modified-Since``) are added to it when
            a stale entry is found.
        :returns: the cached response with ``from_cache = True``, or
            ``False`` when the network must be used.
        """
        cache_url = self.cache_url(url)
        cc = self.parse_cache_control(headers)

        # non-caching states
        no_cache = 'no-cache' in cc
        # Directive values are strings, so compare the parsed number.
        if 'max-age' in cc and self._to_int(cc['max-age'], None) == 0:
            no_cache = True

        # see if it is in the cache anyways (fetched once and reused)
        resp = self.cache.get(cache_url)
        if no_cache or not resp:
            return False

        # Check our Vary header to make sure our request headers match
        # up. We don't delete it from the cache though, we just don't
        # return our cached value.
        #
        # NOTE: Because httplib2 stores raw content, it denotes
        #       headers that were sent in the original response by
        #       adding -varied-$name. We don't have to do that b/c we
        #       are storing the object which has a reference to the
        #       original request. If that changes, then I'd propose
        #       using the varied headers in the cache key to avoid the
        #       situation all together.
        if 'vary' in resp.headers:
            varied_headers = resp.headers['vary'].replace(' ', '').split(',')
            original_headers = resp.request.headers
            for header in varied_headers:
                # If our headers don't match for the headers listed in
                # the vary header, then don't use the cached response
                if headers.get(header, None) != original_headers.get(header):
                    return False

        if self._is_fresh(resp, cc):
            # make sure we set the from_cache to true
            resp.from_cache = True
            return resp

        # we're not fresh. If we don't have an Etag, clear it out
        if 'etag' in resp.headers:
            headers['If-None-Match'] = resp.headers['ETag']
        else:
            self.cache.delete(cache_url)

        if 'last-modified' in resp.headers:
            headers['If-Modified-Since'] = resp.headers['Last-Modified']

        # return the original handler
        return False

    def add_headers(self, url):
        """Return an ``If-None-Match`` header dict for *url* if its cached
        entry has an etag, otherwise an empty dict."""
        # Entries are stored under the normalised URL, so look them up the
        # same way.
        resp = self.cache.get(self.cache_url(url))
        if resp and 'etag' in resp.headers:
            return {'If-None-Match': resp.headers['etag']}
        return {}

    def cache_response(self, request, resp):
        """
        Algorithm for caching requests.

        This assumes a requests Response object. Only 200 and 203
        responses are considered.
        """
        # From httplib2: Don't cache 206's since we aren't going to
        # handle byte range requests
        if resp.status_code not in [200, 203]:
            return

        cc_req = self.parse_cache_control(request.headers)
        cc = self.parse_cache_control(resp.headers)

        cache_url = self.cache_url(request.url)

        # Delete it from the cache if we happen to have it stored there
        no_store = cc.get('no-store') or cc_req.get('no-store')
        if no_store and self.cache.get(cache_url):
            self.cache.delete(cache_url)
        # ...and do not store it again. ``cache_all`` is an explicit
        # request to cache regardless of the server's headers, so it keeps
        # overriding no-store as before.
        if no_store and not self.cache_all:
            return

        # If we've been given an etag, then keep the response
        should_store = bool(self.cache_etags and 'etag' in resp.headers)

        # If we want to cache sites not setup with cache headers then add
        # the proper headers and keep the response
        if self.cache_all:
            expires = datetime.datetime.utcnow() + datetime.timedelta(days=(25 * 365))
            expires = expires.strftime("%a, %d %b %Y %H:%M:%S GMT")
            headers = {'Cache-Control': 'public,max-age=%d' % int(3600),
                       'Expires': expires}
            resp.headers.update(headers)
            should_store = True

        # Add to the cache if the response headers demand it. If there
        # is no date header then we can't do anything about expiring
        # the cache.
        elif 'date' in resp.headers:
            # cache when there is a max-age > 0 (a malformed value counts
            # as 0 instead of raising)
            if cc.get('max-age'):
                if self._to_int(cc['max-age'], 0) > 0:
                    should_store = True

            # If the request can expire, it means we should cache it
            # in the meantime.
            elif 'expires' in resp.headers:
                if resp.headers['expires']:
                    should_store = True

        if should_store:
            self.cache.set(cache_url, resp)

    def update_cached_response(self, request, response):
        """On a 304 we will get a new set of headers that we want to
        update our cached value with, assuming we have one.

        This should only ever be called when we've sent an ETag and
        gotten a 304 as the response.

        :returns: the refreshed cached response, or *response* itself when
            nothing is cached for the request URL.
        """
        cache_url = self.cache_url(request.url)

        resp = self.cache.get(cache_url)

        if not resp:
            # we didn't have a cached response
            return response

        # We did, so update its headers with the ones from the 304. The
        # 304 has no body, so its Content-Length must not replace the one
        # describing the cached body.
        resp.headers.update(dict(
            (name, value) for name, value in response.headers.items()
            if name.lower() != 'content-length'
        ))

        # we want a 200 b/c we have content via the cache
        resp.status_code = 200

        # update the request as it has the if-none-match header + any
        # other headers that the server might have updated (ie Date,
        # Cache-Control, Expires, etc.)
        resp.request = request

        # update our cache
        self.cache.set(cache_url, resp)

        # Let everyone know this was from the cache.
        resp.from_cache = True

        return resp
|
56
lib/cachecontrol/patch_requests.py
Normal file
56
lib/cachecontrol/patch_requests.py
Normal file
@ -0,0 +1,56 @@
|
|||||||
|
import requests
|
||||||
|
|
||||||
|
from requests import models
|
||||||
|
from requests.packages.urllib3.response import HTTPResponse
|
||||||
|
|
||||||
|
# Response attributes that are copied into the pickled state.
__attrs__ = [
    '_content',
    'status_code',
    'headers',
    'url',
    'history',
    'encoding',
    'reason',
    'cookies',
    'elapsed',
]


def response_getstate(self):
    """Return the picklable state of a response (``__getstate__`` hook).

    The state holds every attribute named in ``__attrs__`` (``None`` when
    the attribute is missing) plus ``raw_original_response``, taken from
    ``self.raw._original_response`` when available.
    """
    # consume everything; an instance that lacks the flag (for example one
    # rebuilt without running __init__) is handled the same way
    if not getattr(self, '_content_consumed', False):
        self.content

    state = dict(
        (attr, getattr(self, attr, None))
        for attr in __attrs__
    )

    # deal with our raw content b/c we need it for our cookie jar.
    # ``raw`` may be None (cached responses have it cleared), so fall back
    # to None instead of raising AttributeError.
    raw = getattr(self, 'raw', None)
    state['raw_original_response'] = getattr(raw, '_original_response', None)
    return state
|
||||||
|
|
||||||
|
|
||||||
|
def response_setstate(self, state):
    """Restore a response from pickled *state* (``__setstate__`` hook).

    Every entry except ``raw_original_response`` becomes an attribute. A
    fresh ``HTTPResponse`` is installed as ``raw`` and given the saved
    original response.
    """
    for name, value in state.items():
        if name != 'raw_original_response':
            setattr(self, name, value)

    # Unpickling bypasses __init__, so this flag would otherwise be
    # missing; the body was fully read before the state was captured.
    self._content_consumed = True

    self.raw = HTTPResponse()
    self.raw._original_response = state.get('raw_original_response')
|
||||||
|
|
||||||
|
|
||||||
|
def make_responses_pickleable():
    """Install pickling hooks on ``models.Response`` for requests < 2.2.

    The installed ``requests`` version is read from
    ``requests.__version__``; only the major and minor components are
    used, and non-numeric suffixes (e.g. ``0rc1``) are tolerated.
    """
    def leading_int(text):
        # int() of the leading digits of *text*, 0 when there are none
        digits = ''
        for char in text:
            if not char.isdigit():
                break
            digits += char
        return int(digits) if digits else 0

    parts = requests.__version__.split('.')
    major = leading_int(parts[0])
    minor = leading_int(parts[1]) if len(parts) > 1 else 0

    # must be >= 2.2.x to skip patching. Comparing as a tuple avoids
    # wrongly patching e.g. 3.0, whose minor component is below 2.
    if (major, minor) < (2, 2):
        models.Response.__getstate__ = response_getstate
        models.Response.__setstate__ = response_setstate
|
||||||
|
|
||||||
|
|
||||||
|
make_responses_pickleable()
|
10
lib/cachecontrol/wrapper.py
Normal file
10
lib/cachecontrol/wrapper.py
Normal file
@ -0,0 +1,10 @@
|
|||||||
|
from cachecontrol.adapter import CacheControlAdapter
|
||||||
|
from cachecontrol.cache import DictCache
|
||||||
|
|
||||||
|
|
||||||
|
def CacheControl(sess, cache=None, cache_etags=True, cache_all=False):
    """Mount a caching adapter on *sess* and return the same session.

    A ``DictCache`` is used when *cache* is not given (or is falsy). The
    adapter is mounted for the ``http://`` prefix only.
    """
    backend = cache or DictCache()
    sess.mount(
        'http://',
        CacheControlAdapter(backend, cache_etags=cache_etags, cache_all=cache_all)
    )
    return sess
|
@ -1,14 +0,0 @@
|
|||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
__init__.py
|
|
||||||
~~~~~~~~~~~
|
|
||||||
|
|
||||||
Defines the public API to the httpcache module.
|
|
||||||
"""
|
|
||||||
|
|
||||||
__version__ = '0.1.3'
|
|
||||||
|
|
||||||
from .cache import HTTPCache
|
|
||||||
from .adapter import CachingHTTPAdapter
|
|
||||||
|
|
||||||
# __all__ must list names as strings; listing the objects themselves makes
# ``from httpcache import *`` fail.
__all__ = ['HTTPCache', 'CachingHTTPAdapter']
|
|
@ -1,55 +0,0 @@
|
|||||||
"""
|
|
||||||
adapter.py
|
|
||||||
~~~~~~~~~~
|
|
||||||
|
|
||||||
Contains an implementation of an HTTP adapter for Requests that is aware of the
|
|
||||||
cache contained in this module.
|
|
||||||
"""
|
|
||||||
from requests.adapters import HTTPAdapter
|
|
||||||
from .cache import HTTPCache
|
|
||||||
|
|
||||||
|
|
||||||
class CachingHTTPAdapter(HTTPAdapter):
    """
    A HTTP-caching-aware Transport Adapter for Python Requests. The central
    portion of the API.

    :param capacity: The maximum capacity of the backing cache.
    """
    def __init__(self, capacity=50, **kwargs):
        super(CachingHTTPAdapter, self).__init__(**kwargs)

        #: The HTTP Cache backing the adapter.
        self.cache = HTTPCache(capacity=capacity)

    def send(self, request, **kwargs):
        """
        Sends a PreparedRequest object, respecting RFC 2616's rules about HTTP
        caching. Returns a Response object that may have been cached.

        :param request: The Requests :class:`PreparedRequest <PreparedRequest>` object to send.
        """
        cached_resp = self.cache.retrieve(request)

        if cached_resp is not None:
            return cached_resp

        return super(CachingHTTPAdapter, self).send(request, **kwargs)

    def build_response(self, request, response):
        """
        Builds a Response object from a urllib3 response. May involve returning
        a cached Response.

        :param request: The Requests :class:`PreparedRequest <PreparedRequest>` object sent.
        :param response: The urllib3 response.
        """
        resp = super(CachingHTTPAdapter, self).build_response(request,
                                                              response)

        if resp.status_code == 304:
            # handle_304 returns None when nothing is cached for the URL;
            # keep the 304 response in that case rather than handing None
            # back to the caller.
            cached = self.cache.handle_304(resp)
            if cached is not None:
                resp = cached
        else:
            self.cache.store(resp)

        return resp
|
|
@ -1,207 +0,0 @@
|
|||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
cache.py
|
|
||||||
~~~~~~~~
|
|
||||||
|
|
||||||
Contains the primary cache structure used in http-cache.
|
|
||||||
"""
|
|
||||||
from .structures import RecentOrderedDict
|
|
||||||
from .utils import (parse_date_header, build_date_header,
|
|
||||||
expires_from_cache_control, url_contains_query)
|
|
||||||
from datetime import datetime
|
|
||||||
|
|
||||||
|
|
||||||
# RFC 2616 specifies that we can cache 200 OK, 203 Non Authoritative,
|
|
||||||
# 206 Partial Content, 300 Multiple Choices, 301 Moved Permanently and
|
|
||||||
# 410 Gone responses. We don't cache 206s at the moment because we
|
|
||||||
# don't handle Range and Content-Range headers.
|
|
||||||
CACHEABLE_RCS = (200, 203, 300, 301, 410)
|
|
||||||
|
|
||||||
# Cacheable verbs.
|
|
||||||
CACHEABLE_VERBS = ('GET', 'HEAD', 'OPTIONS')
|
|
||||||
|
|
||||||
# Some verbs MUST invalidate the resource in the cache, according to RFC 2616.
|
|
||||||
# If we send one of these, or any verb we don't recognise, invalidate the
|
|
||||||
# cache entry for that URL. As it happens, these are also the cacheable
|
|
||||||
# verbs. That works out well for us.
|
|
||||||
NON_INVALIDATING_VERBS = CACHEABLE_VERBS
|
|
||||||
|
|
||||||
|
|
||||||
class HTTPCache(object):
|
|
||||||
"""
|
|
||||||
The HTTP Cache object. Manages caching of responses according to RFC 2616,
|
|
||||||
adding necessary headers to HTTP request objects, and returning cached
|
|
||||||
responses based on server responses.
|
|
||||||
|
|
||||||
This object is not expected to be used by most users. It is exposed as part
|
|
||||||
of the public API for users who feel the need for more control. This API
|
|
||||||
may change in a minor version increase. Be warned.
|
|
||||||
|
|
||||||
:param capacity: (Optional) The maximum capacity of the HTTP cache.
|
|
||||||
"""
|
|
||||||
def __init__(self, capacity=50):
|
|
||||||
#: The maximum capacity of the HTTP cache. When this many cache entries
|
|
||||||
#: end up in the cache, the oldest entries are removed.
|
|
||||||
self.capacity = capacity
|
|
||||||
|
|
||||||
#: The cache backing store. Cache entries are stored here as key-value
|
|
||||||
#: pairs. The key is the URL used to retrieve the cached response. The
|
|
||||||
#: value is a python dict, which stores three objects: the response
|
|
||||||
#: (keyed off of 'response'), the retrieval or creation date (keyed off
|
|
||||||
#: of 'creation') and the cache expiry date (keyed off of 'expiry').
|
|
||||||
#: This last value may be None.
|
|
||||||
self._cache = RecentOrderedDict()
|
|
||||||
|
|
||||||
def store(self, response):
|
|
||||||
"""
|
|
||||||
Takes an HTTP response object and stores it in the cache according to
|
|
||||||
RFC 2616. Returns a boolean value indicating whether the response was
|
|
||||||
cached or not.
|
|
||||||
|
|
||||||
:param response: Requests :class:`Response <Response>` object to cache.
|
|
||||||
"""
|
|
||||||
# Define an internal utility function.
|
|
||||||
def date_header_or_default(header_name, default, response):
|
|
||||||
try:
|
|
||||||
date_header = response.headers[header_name]
|
|
||||||
except KeyError:
|
|
||||||
value = default
|
|
||||||
else:
|
|
||||||
value = parse_date_header(date_header)
|
|
||||||
return value
|
|
||||||
|
|
||||||
if response.status_code not in CACHEABLE_RCS:
|
|
||||||
return False
|
|
||||||
|
|
||||||
if response.request.method not in CACHEABLE_VERBS:
|
|
||||||
return False
|
|
||||||
|
|
||||||
url = response.url
|
|
||||||
now = datetime.utcnow()
|
|
||||||
|
|
||||||
# Get the value of the 'Date' header, if it exists. If it doesn't, just
|
|
||||||
# use now.
|
|
||||||
creation = date_header_or_default('Date', now, response)
|
|
||||||
|
|
||||||
# Get the value of the 'Cache-Control' header, if it exists.
|
|
||||||
cc = response.headers.get('Cache-Control', None)
|
|
||||||
if cc is not None:
|
|
||||||
expiry = expires_from_cache_control(cc, now)
|
|
||||||
|
|
||||||
# If the above returns None, we are explicitly instructed not to
|
|
||||||
# cache this.
|
|
||||||
if expiry is None:
|
|
||||||
return False
|
|
||||||
|
|
||||||
# Get the value of the 'Expires' header, if it exists, and if we don't
|
|
||||||
# have anything from the 'Cache-Control' header.
|
|
||||||
if cc is None:
|
|
||||||
expiry = date_header_or_default('Expires', None, response)
|
|
||||||
|
|
||||||
# If the expiry date is earlier or the same as the Date header, don't
|
|
||||||
# cache the response at all.
|
|
||||||
if expiry is not None and expiry <= creation:
|
|
||||||
return False
|
|
||||||
|
|
||||||
# If there's a query portion of the url and it's a GET, don't cache
|
|
||||||
# this unless explicitly instructed to.
|
|
||||||
if expiry is None and response.request.method == 'GET':
|
|
||||||
if url_contains_query(url):
|
|
||||||
return False
|
|
||||||
|
|
||||||
self._cache[url] = {'response': response,
|
|
||||||
'creation': creation,
|
|
||||||
'expiry': expiry}
|
|
||||||
|
|
||||||
self.__reduce_cache_count()
|
|
||||||
|
|
||||||
return True
|
|
||||||
|
|
||||||
def handle_304(self, response):
|
|
||||||
"""
|
|
||||||
Given a 304 response, retrieves the cached entry. This unconditionally
|
|
||||||
returns the cached entry, so it can be used when the 'intelligent'
|
|
||||||
behaviour of retrieve() is not desired.
|
|
||||||
|
|
||||||
Returns None if there is no entry in the cache.
|
|
||||||
|
|
||||||
:param response: The 304 response to find the cached entry for. Should be a Requests :class:`Response <Response>`.
|
|
||||||
"""
|
|
||||||
try:
|
|
||||||
cached_response = self._cache[response.url]['response']
|
|
||||||
except KeyError:
|
|
||||||
cached_response = None
|
|
||||||
|
|
||||||
return cached_response
|
|
||||||
|
|
||||||
def retrieve(self, request):
|
|
||||||
"""
|
|
||||||
Retrieves a cached response if possible.
|
|
||||||
|
|
||||||
If there is a response that can be unconditionally returned (e.g. one
|
|
||||||
that had a Cache-Control header set), that response is returned. If
|
|
||||||
there is one that can be conditionally returned (if a 304 is returned),
|
|
||||||
applies an If-Modified-Since header to the request and returns None.
|
|
||||||
|
|
||||||
:param request: The Requests :class:`PreparedRequest <PreparedRequest>` object.
|
|
||||||
"""
|
|
||||||
return_response = None
|
|
||||||
url = request.url
|
|
||||||
|
|
||||||
try:
|
|
||||||
cached_response = self._cache[url]
|
|
||||||
except KeyError:
|
|
||||||
return None
|
|
||||||
|
|
||||||
if request.method not in NON_INVALIDATING_VERBS:
|
|
||||||
del self._cache[url]
|
|
||||||
return None
|
|
||||||
|
|
||||||
if cached_response['expiry'] is None:
|
|
||||||
# We have no explicit expiry time, so we weren't instructed to
|
|
||||||
# cache. Add an 'If-Modified-Since' header.
|
|
||||||
creation = cached_response['creation']
|
|
||||||
header = build_date_header(creation)
|
|
||||||
request.headers['If-Modified-Since'] = header
|
|
||||||
else:
|
|
||||||
# We have an explicit expiry time. If we're earlier than the expiry
|
|
||||||
# time, return the response.
|
|
||||||
now = datetime.utcnow()
|
|
||||||
|
|
||||||
if now <= cached_response['expiry']:
|
|
||||||
return_response = cached_response['response']
|
|
||||||
else:
|
|
||||||
del self._cache[url]
|
|
||||||
|
|
||||||
return return_response
|
|
||||||
|
|
||||||
def __reduce_cache_count(self):
    """
    Trim the cache until it holds no more than ``self.capacity`` entries.

    First pass: walk the keys in the order ``self._cache.keys()`` yields
    them and delete entries whose ``'expiry'`` is None, stopping as soon as
    enough have been removed. Second pass: if the cache is still over
    capacity, delete the remaining entries from the front of the key order
    until it fits.
    """
    excess = len(self._cache) - self.capacity
    if excess <= 0:
        return

    for candidate in list(self._cache.keys()):
        if self._cache[candidate]['expiry'] is not None:
            continue
        del self._cache[candidate]
        excess -= 1
        if excess == 0:
            return

    # Still too many entries: drop from the front of the remaining order.
    survivors = list(self._cache.keys())
    position = 0
    while position < excess:
        del self._cache[survivors[position]]
        position += 1

    return
|
|
@ -1,10 +0,0 @@
|
|||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
compat.py
|
|
||||||
~~~~~~~~~
|
|
||||||
|
|
||||||
Defines cross-platform functions and classes needed to achieve proper
|
|
||||||
functionality.
|
|
||||||
"""
|
|
||||||
|
|
||||||
pass
|
|
@ -1,59 +0,0 @@
|
|||||||
"""
|
|
||||||
structures.py
|
|
||||||
~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
Defines structures used by the httpcache module.
|
|
||||||
"""
|
|
||||||
|
|
||||||
class RecentOrderedDict(dict):
    """
    A dictionary variant that tracks how recently each key was used.

    Every insertion or lookup moves the key to the end of the internal
    order list, so iteration, ``keys()``, ``values()`` and ``items()`` run
    from the least recently used key to the most recently used one.

    Only the methods overridden here are backed by the tracked storage
    (``_data`` / ``_order``); other inherited ``dict`` methods still operate
    on the unused base dictionary.
    """
    def __init__(self):
        super(RecentOrderedDict, self).__init__()
        self._data = {}
        self._order = []

    def __setitem__(self, key, value):
        # Re-inserting an existing key refreshes its position.
        if key in self._data:
            self._order.remove(key)

        self._order.append(key)
        self._data[key] = value

    def __getitem__(self, key):
        # Look up first so a missing key raises KeyError before the order
        # list is touched.
        value = self._data[key]
        self._order.remove(key)
        self._order.append(key)
        return value

    def __delitem__(self, key):
        del self._data[key]
        self._order.remove(key)

    def __iter__(self):
        # __iter__ must return an iterator, not the list itself. Iterate
        # over a snapshot so lookups made during iteration (which reorder
        # the keys) cannot disturb it.
        return iter(list(self._order))

    def __len__(self):
        return len(self._order)

    def __contains__(self, value):
        return self._data.__contains__(value)

    def items(self):
        """Return ``(key, value)`` pairs, least recently used first."""
        return [(key, self._data[key]) for key in self._order]

    def keys(self):
        """Return a list of keys, least recently used first."""
        # Hand out a copy so callers cannot corrupt the internal order.
        return list(self._order)

    def values(self):
        """Return the values, least recently used first."""
        return [self._data[key] for key in self._order]

    def clear(self):
        self._data = {}
        self._order = []

    def copy(self):
        """Return a shallow copy that preserves the current key order."""
        c = RecentOrderedDict()
        c._data = self._data.copy()
        c._order = self._order[:]
        return c
|
|
@ -1,97 +0,0 @@
|
|||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
utils.py
|
|
||||||
~~~~~~~~
|
|
||||||
|
|
||||||
Utility functions for use with httpcache.
|
|
||||||
"""
|
|
||||||
from datetime import datetime, timedelta
|
|
||||||
|
|
||||||
try: # Python 2
|
|
||||||
from urlparse import urlparse
|
|
||||||
except ImportError: # Python 3
|
|
||||||
from urllib.parse import urlparse
|
|
||||||
|
|
||||||
RFC_1123_DT_STR = "%a, %d %b %Y %H:%M:%S GMT"
RFC_850_DT_STR = "%A, %d-%b-%y %H:%M:%S GMT"
# ANSI C asctime() layout, e.g. "Sun Nov  6 08:49:37 1994".
ASCTIME_DT_STR = "%a %b %d %H:%M:%S %Y"


def parse_date_header(header):
    """
    Given a date header in one of the forms specified by RFC 2616, return a
    naive Python datetime object.

    RFC 2616 specifies three possible formats for date/time headers (RFC
    1123, RFC 850 and C asctime()), and makes it clear that all dates/times
    should be in UTC/GMT. That is assumed by this library, which simply does
    everything in UTC. The formats are tried in that order.

    This function does _not_ follow Postel's Law. If the value does not
    strictly match one of the three defined formats, or is not a string at
    all, this function returns None. This is considered 'safe' behaviour.
    """
    for layout in (RFC_1123_DT_STR, RFC_850_DT_STR, ASCTIME_DT_STR):
        try:
            return datetime.strptime(header, layout)
        except ValueError:
            # Wrong layout; try the next one.
            continue
        except TypeError:
            # Not a string (e.g. the header was absent and None was passed).
            return None

    return None
|
|
||||||
|
|
||||||
|
|
||||||
def build_date_header(dt):
    """
    Given a Python datetime object, build a Date header value according to
    RFC 2616.

    RFC 2616 specifies that the RFC 1123 form is to be preferred, so that is
    what we use. The value is produced with ``email.utils.formatdate``
    rather than ``strftime`` because ``%a``/``%b`` follow the process
    locale, while HTTP requires the English day and month names.

    :param dt: datetime to format; a naive value is taken to be UTC.
    :returns: a string such as ``'Sun, 06 Nov 1994 08:49:37 GMT'``.
    """
    import calendar
    from email.utils import formatdate

    # utctimetuple() leaves naive values untouched and converts aware ones
    # to UTC; timegm() then turns that UTC tuple into an epoch timestamp.
    timestamp = calendar.timegm(dt.utctimetuple())
    return formatdate(timestamp, usegmt=True)
|
|
||||||
|
|
||||||
|
|
||||||
def expires_from_cache_control(header, current_time):
    """
    Given a Cache-Control header, builds a Python datetime object
    corresponding to the expiry time (in UTC).

    Directives are separated on commas with optional surrounding
    whitespace, and directive names are compared case-insensitively.

    Takes current_time as an argument so that 'max-age=0' yields an expiry
    equal to current_time (immediately stale) without being special-cased.

    :param header: the raw Cache-Control header value.
    :param current_time: datetime the max-age interval is added to.
    :returns: the expiry datetime, or None to indicate that the response
        must not be cached (a no-cache/no-store directive is present, or
        there is no usable max-age).
    """
    max_age = None

    for raw_field in header.split(','):
        name, _, value = raw_field.strip().partition('=')
        name = name.strip().lower()

        # We don't handle no-cache applied to specific fields. To be as
        # 'nice' as possible, treat any no-cache as applying to the whole
        # response, and bail early.
        if name in ('no-cache', 'no-store'):
            return None

        if name == 'max-age':
            try:
                max_age = int(value.strip().strip('"'))
            except ValueError:
                # Malformed value from the server: ignore this directive
                # rather than fail the whole request.
                continue

    # Compare against None so an explicit max-age=0 is honoured.
    if max_age is None:
        return None

    return current_time + timedelta(seconds=max_age)
|
|
||||||
|
|
||||||
def url_contains_query(url):
    """
    Return True when ``url`` has a non-empty query string, False otherwise.

    Relies solely on what ``urlparse`` reports as the query component.
    """
    return bool(urlparse(url).query)
|
|
@ -1,31 +0,0 @@
|
|||||||
#!/usr/bin/env python
|
|
||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
requests_cache
|
|
||||||
~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
Transparent cache for ``requests`` library with persistence and async support
|
|
||||||
|
|
||||||
Just write::
|
|
||||||
|
|
||||||
import requests_cache
|
|
||||||
requests_cache.install_cache()
|
|
||||||
|
|
||||||
And requests to resources will be cached for faster repeated access::
|
|
||||||
|
|
||||||
import requests
|
|
||||||
for i in range(10):
|
|
||||||
r = requests.get('http://httpbin.org/delay/5')
|
|
||||||
# will take approximately 5 seconds instead of 50
|
|
||||||
|
|
||||||
|
|
||||||
:copyright: (c) 2012 by Roman Haritonov.
|
|
||||||
:license: BSD, see LICENSE for more details.
|
|
||||||
"""
|
|
||||||
__docformat__ = 'restructuredtext'
|
|
||||||
__version__ = '0.4.4'
|
|
||||||
|
|
||||||
from .core import(
|
|
||||||
CachedSession, install_cache, uninstall_cache,
|
|
||||||
disabled, enabled, get_cache, clear, configure
|
|
||||||
)
|
|
@ -1,50 +0,0 @@
|
|||||||
#!/usr/bin/env python
|
|
||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
requests_cache.backends
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
Classes and functions for cache persistence
|
|
||||||
"""
|
|
||||||
|
|
||||||
|
|
||||||
from .base import BaseCache
|
|
||||||
|
|
||||||
# Maps a backend name to the cache class implementing it. The in-memory
# backend is always available; the others are added only when their module
# imports cleanly.
registry = {'memory': BaseCache}

try:
    # Heroku doesn't allow the SQLite3 module to be installed
    from .sqlite import DbCache
except ImportError:
    DbCache = None
else:
    registry['sqlite'] = DbCache

try:
    from .mongo import MongoCache
except ImportError:
    MongoCache = None
else:
    # Both spellings select the same backend.
    registry['mongodb'] = MongoCache
    registry['mongo'] = MongoCache

try:
    from .redis import RedisCache
except ImportError:
    RedisCache = None
else:
    registry['redis'] = RedisCache
|
|
||||||
|
|
||||||
|
|
||||||
def create_backend(backend_name, cache_name, options):
    """
    Instantiate the cache backend registered under ``backend_name``.

    :param backend_name: key in ``registry``; None selects the default
        backend name.
    :param cache_name: first positional argument for the backend class.
    :param options: dict of keyword arguments for the backend class.
    :returns: the new backend instance.
    :raises ValueError: if ``backend_name`` is not registered.
    """
    if backend_name is None:
        backend_name = _get_default_backend_name()

    # Only the lookup is guarded: a KeyError raised inside the backend's
    # constructor must not be reported as an unsupported backend.
    try:
        backend_class = registry[backend_name]
    except KeyError:
        raise ValueError('Unsupported backend "%s" try one of: %s' %
                         (backend_name, ', '.join(registry.keys())))

    return backend_class(cache_name, **options)
|
|
||||||
|
|
||||||
|
|
||||||
def _get_default_backend_name():
    """Return ``'sqlite'`` when that backend is registered, else ``'memory'``."""
    return 'sqlite' if 'sqlite' in registry else 'memory'
|
|
@ -1,171 +0,0 @@
|
|||||||
#!/usr/bin/env python
|
|
||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
requests_cache.backends.base
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
Contains BaseCache class which can be used as in-memory cache backend or
|
|
||||||
extended to support persistence.
|
|
||||||
"""
|
|
||||||
from datetime import datetime
|
|
||||||
import hashlib
|
|
||||||
from copy import copy
|
|
||||||
|
|
||||||
import requests
|
|
||||||
|
|
||||||
from ..compat import is_py2
|
|
||||||
|
|
||||||
|
|
||||||
class BaseCache(object):
    """ Base class for cache implementations, can be used as in-memory cache.

    To extend it you can provide dictionary-like objects for
    :attr:`keys_map` and :attr:`responses` or override public methods.
    """
    def __init__(self, *args, **kwargs):
        #: `key` -> `key_in_responses` mapping
        self.keys_map = {}
        #: `key_in_cache` -> `response` mapping
        self.responses = {}

    def save_response(self, key, response):
        """ Save response to cache

        :param key: key for this response
        :param response: response to save

        .. note:: Response is reduced before saving (with :meth:`reduce_response`)
                  to make it picklable
        """
        # Stored as a (reduced_response, utc_timestamp) pair.
        self.responses[key] = self.reduce_response(response), datetime.utcnow()

    def add_key_mapping(self, new_key, key_to_response):
        """
        Adds mapping of `new_key` to `key_to_response` to make it possible to
        associate many keys with single response

        :param new_key: new key (e.g. url from redirect)
        :param key_to_response: key which can be found in :attr:`responses`
        :return:
        """
        self.keys_map[new_key] = key_to_response

    def get_response_and_time(self, key, default=(None, None)):
        """ Retrieves response and timestamp for `key` if it's stored in cache,
        otherwise returns `default`

        :param key: key of resource
        :param default: return this if `key` not found in cache
        :returns: tuple (response, datetime)

        .. note:: Response is restored after unpickling with :meth:`restore_response`
        """
        try:
            if key not in self.responses:
                # `key` may be an alias; follow it to the real response key.
                key = self.keys_map[key]
            response, timestamp = self.responses[key]
        except KeyError:
            return default
        return self.restore_response(response), timestamp

    def delete(self, key):
        """ Delete `key` from cache. Also deletes the key mappings of all
        responses from the response history.

        Unknown keys are ignored.
        """
        try:
            if key in self.responses:
                response, _ = self.responses[key]
                del self.responses[key]
            else:
                response, _ = self.responses[self.keys_map[key]]
                del self.keys_map[key]
        except KeyError:
            return

        for r in response.history:
            try:
                del self.keys_map[self.create_key(r.request)]
            except KeyError:
                # This redirect was never mapped (or is already gone); keep
                # cleaning up the remaining history entries.
                continue

    def delete_url(self, url):
        """ Delete response associated with `url` from cache.
        Also deletes all responses from response history. Works only for GET requests
        """
        self.delete(self._url_to_key(url))

    def clear(self):
        """ Clear cache
        """
        self.responses.clear()
        self.keys_map.clear()

    def has_key(self, key):
        """ Returns `True` if cache has `key`, `False` otherwise
        """
        return key in self.responses or key in self.keys_map

    def has_url(self, url):
        """ Returns `True` if cache has `url`, `False` otherwise.
        Works only for GET request urls
        """
        return self.has_key(self._url_to_key(url))

    def _url_to_key(self, url):
        """ Build the cache key of a GET request for `url`. """
        from requests import Request
        return self.create_key(Request('GET', url).prepare())

    # Response attributes copied by reduce_response / restore_response.
    _response_attrs = ['_content', 'url', 'status_code', 'cookies',
                       'headers', 'encoding', 'request', 'reason', 'raw']

    # Attributes of `response.raw` that are kept when it is reduced.
    _raw_response_attrs = ['_original_response', 'decode_content', 'headers',
                           'reason', 'status', 'strict', 'version']

    def reduce_response(self, response):
        """ Reduce response object to make it compatible with ``pickle``
        """
        result = _Store()
        # prefetch: accessing .content before _content is copied below
        response.content
        for field in self._response_attrs:
            setattr(result, field, self._picklable_field(response, field))
        result.history = tuple(self.reduce_response(r) for r in response.history)
        return result

    def _picklable_field(self, response, name):
        """ Return attribute `name` of `response`, with the `request` and
        `raw` attributes replaced by reduced stand-ins.
        """
        value = getattr(response, name)
        if name == 'request':
            # Work on a copy so the caller's request keeps its hooks.
            value = copy(value)
            value.hooks = []
        elif name == 'raw':
            result = _Store()
            for field in self._raw_response_attrs:
                setattr(result, field, getattr(value, field, None))
            value = result
        return value

    def restore_response(self, response):
        """ Restore response object after unpickling
        """
        result = requests.Response()
        for field in self._response_attrs:
            setattr(result, field, getattr(response, field, None))
        result.history = tuple(self.restore_response(r) for r in response.history)
        return result

    def create_key(self, request):
        """ Return the SHA-256 hex digest of the request's upper-cased
        method, its URL and, when present, its body.
        """
        key = hashlib.sha256()
        key.update(_to_bytes(request.method.upper()))
        key.update(_to_bytes(request.url))
        if request.body:
            key.update(_to_bytes(request.body))
        return key.hexdigest()

    def __str__(self):
        return 'keys: %s\nresponses: %s' % (self.keys_map, self.responses)
|
|
||||||
|
|
||||||
|
|
||||||
# used for saving response attributes
|
|
||||||
class _Store(object):
    """Plain attribute holder used for saving response attributes."""
|
|
||||||
|
|
||||||
|
|
||||||
def _to_bytes(s, encoding='utf-8'):
    """
    Return ``s`` encoded with ``encoding`` when it is text; any other value
    (already-encoded bytes in particular) is returned unchanged.

    The check is on the text type itself rather than on the interpreter
    version, so unicode input is encoded on Python 2 as well instead of
    being passed through as-is.
    """
    # type(u'') is `unicode` on Python 2 and `str` on Python 3.
    if isinstance(s, type(u'')):
        return s.encode(encoding)
    return s
|
|
@ -1,25 +0,0 @@
|
|||||||
#!/usr/bin/env python
|
|
||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
requests_cache.backends.mongo
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
``mongo`` cache backend
|
|
||||||
"""
|
|
||||||
from .base import BaseCache
|
|
||||||
from .storage.mongodict import MongoDict, MongoPickleDict
|
|
||||||
|
|
||||||
|
|
||||||
class MongoCache(BaseCache):
    """ ``mongo`` cache backend.
    """
    def __init__(self, db_name='requests-cache', **options):
        """
        :param db_name: database name (default: ``'requests-cache'``)
        :param connection: (optional) ``pymongo.Connection``
        """
        super(MongoCache, self).__init__()
        connection = options.get('connection')
        responses = MongoPickleDict(db_name, 'responses', connection)
        self.responses = responses
        # The key map reuses whichever connection the responses store ended up with.
        self.keys_map = MongoDict(db_name, 'urls', responses.connection)
|
|
||||||
|
|
@ -1,24 +0,0 @@
|
|||||||
#!/usr/bin/env python
|
|
||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
requests_cache.backends.redis
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
``redis`` cache backend
|
|
||||||
"""
|
|
||||||
from .base import BaseCache
|
|
||||||
from .storage.redisdict import RedisDict
|
|
||||||
|
|
||||||
|
|
||||||
class RedisCache(BaseCache):
    """ ``redis`` cache backend.
    """
    def __init__(self, namespace='requests-cache', **options):
        """
        :param namespace: redis namespace (default: ``'requests-cache'``)
        :param connection: (optional) ``redis.StrictRedis``
        """
        super(RedisCache, self).__init__()
        connection = options.get('connection')
        responses = RedisDict(namespace, 'responses', connection)
        self.responses = responses
        # The key map reuses whichever connection the responses store ended up with.
        self.keys_map = RedisDict(namespace, 'urls', responses.connection)
|
|
@ -1,30 +0,0 @@
|
|||||||
#!/usr/bin/env python
|
|
||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
requests_cache.backends.sqlite
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
``sqlite3`` cache backend
|
|
||||||
"""
|
|
||||||
from .base import BaseCache
|
|
||||||
from .storage.dbdict import DbDict, DbPickleDict
|
|
||||||
|
|
||||||
|
|
||||||
class DbCache(BaseCache):
    """ sqlite cache backend.

    Reading is fast, saving is a bit slower. It can store big amount of data
    with low memory usage.
    """
    def __init__(self, location='cache',
                 fast_save=False, extension='.sqlite', **options):
        """
        :param location: database filename prefix (default: ``'cache'``)
        :param fast_save: Speedup cache saving up to 50 times but with possibility of data loss.
                          See :ref:`backends.DbDict <backends_dbdict>` for more info
        :param extension: extension for filename (default: ``'.sqlite'``)
        """
        super(DbCache, self).__init__()
        # Both tables are opened on the same database file.
        db_file = location + extension
        self.responses = DbPickleDict(db_file, 'responses', fast_save=fast_save)
        self.keys_map = DbDict(db_file, 'urls')
|
|
||||||
|
|
@ -1,171 +0,0 @@
|
|||||||
#!/usr/bin/python
|
|
||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
requests_cache.backends.dbdict
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
Dictionary-like objects for saving large data sets to `sqlite` database
|
|
||||||
"""
|
|
||||||
from collections import MutableMapping
|
|
||||||
import sqlite3 as sqlite
|
|
||||||
from contextlib import contextmanager
|
|
||||||
try:
|
|
||||||
import threading
|
|
||||||
except ImportError:
|
|
||||||
import dummy_threading as threading
|
|
||||||
try:
|
|
||||||
import cPickle as pickle
|
|
||||||
except ImportError:
|
|
||||||
import pickle
|
|
||||||
|
|
||||||
from requests_cache.compat import bytes
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
class DbDict(MutableMapping):
    """ DbDict - a dictionary-like object for saving large datasets to `sqlite` database

    It's possible to create multiple DbDict instances, which will be stored as separate
    tables in one database::

        d1 = DbDict('test', 'table1')
        d2 = DbDict('test', 'table2')
        d3 = DbDict('test', 'table3')

    all data will be stored in ``test.sqlite`` database into
    correspondent tables: ``table1``, ``table2`` and ``table3``
    """

    def __init__(self, filename, table_name='data', fast_save=False, **options):
        """
        :param filename: filename for database (without extension)
        :param table_name: table name
        :param fast_save: If it's True, then sqlite will be configured with
                          `"PRAGMA synchronous = 0;" <http://www.sqlite.org/pragma.html#pragma_synchronous>`_
                          to speedup cache saving, but be careful, it's dangerous.
                          Tests showed that insertion order of records can be wrong with this option.
        """
        self.filename = filename
        self.table_name = table_name
        self.fast_save = fast_save

        #: Transactions can be committed if this property is set to `True`
        self.can_commit = True

        # While _bulk_commit is set, every operation shares
        # _pending_connection instead of opening its own connection.
        self._bulk_commit = False
        self._pending_connection = None
        self._lock = threading.RLock()
        with self.connection() as con:
            con.execute("create table if not exists `%s` (key PRIMARY KEY, value)" % self.table_name)

    @contextmanager
    def connection(self, commit_on_success=False):
        """
        Yield a sqlite connection while holding the instance lock.

        Outside :meth:`bulk_commit` a fresh connection is opened and closed
        on exit; inside it the shared pending connection is reused and left
        open.

        :param commit_on_success: commit after the ``with`` body finishes
            without raising, provided :attr:`can_commit` is `True`
        """
        with self._lock:
            if self._bulk_commit:
                if self._pending_connection is None:
                    self._pending_connection = sqlite.connect(self.filename)
                con = self._pending_connection
            else:
                con = sqlite.connect(self.filename)
            try:
                if self.fast_save:
                    con.execute("PRAGMA synchronous = 0;")
                yield con
                if commit_on_success and self.can_commit:
                    con.commit()
            finally:
                if not self._bulk_commit:
                    con.close()

    def commit(self, force=False):
        """
        Commits pending transaction if :attr:`can_commit` or `force` is `True`

        :param force: force commit, ignore :attr:`can_commit`
        """
        if force or self.can_commit:
            if self._pending_connection is not None:
                self._pending_connection.commit()

    @contextmanager
    def bulk_commit(self):
        """
        Context manager used to speedup insertion of big number of records
        ::

            >>> d1 = DbDict('test')
            >>> with d1.bulk_commit():
            ...     for i in range(1000):
            ...         d1[i] = i * 2

        """
        self._bulk_commit = True
        self.can_commit = False
        try:
            yield
            self.commit(True)
        finally:
            self._bulk_commit = False
            self.can_commit = True
            # No connection exists if the block never touched the database.
            if self._pending_connection is not None:
                self._pending_connection.close()
                self._pending_connection = None

    def __getitem__(self, key):
        with self.connection() as con:
            row = con.execute("select value from `%s` where key=?" %
                              self.table_name, (key,)).fetchone()
            if not row:
                raise KeyError(key)
            return row[0]

    def __setitem__(self, key, item):
        with self.connection(True) as con:
            if con.execute("select key from `%s` where key=?" %
                           self.table_name, (key,)).fetchone():
                con.execute("update `%s` set value=? where key=?" %
                            self.table_name, (item, key))
            else:
                con.execute("insert into `%s` (key,value) values (?,?)" %
                            self.table_name, (key, item))

    def __delitem__(self, key):
        with self.connection(True) as con:
            if con.execute("select key from `%s` where key=?" %
                           self.table_name, (key,)).fetchone():
                con.execute("delete from `%s` where key=?" %
                            self.table_name, (key,))
            else:
                raise KeyError(key)

    def __iter__(self):
        with self.connection() as con:
            for row in con.execute("select key from `%s`" %
                                   self.table_name):
                yield row[0]

    def __len__(self):
        with self.connection() as con:
            return con.execute("select count(key) from `%s`" %
                               self.table_name).fetchone()[0]

    def clear(self):
        """ Remove every record by dropping and re-creating the table. """
        with self.connection(True) as con:
            con.execute("drop table `%s`" % self.table_name)
            con.execute("create table `%s` (key PRIMARY KEY, value)" %
                        self.table_name)

    def __str__(self):
        return str(dict(self.items()))
|
|
||||||
|
|
||||||
|
|
||||||
class DbPickleDict(DbDict):
    """ Same as :class:`DbDict`, but pickles values before saving
    """
    def __setitem__(self, key, item):
        # Wrap the pickle in sqlite.Binary before handing it to the table.
        blob = sqlite.Binary(pickle.dumps(item))
        super(DbPickleDict, self).__setitem__(key, blob)

    def __getitem__(self, key):
        # NOTE(review): pickle.loads runs on whatever is in the database
        # file, so that file has to be trusted.
        stored = super(DbPickleDict, self).__getitem__(key)
        return pickle.loads(bytes(stored))
|
|
@ -1,74 +0,0 @@
|
|||||||
#!/usr/bin/env python
|
|
||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
requests_cache.backends.mongodict
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
Dictionary-like objects for saving large data sets to ``mongodb`` database
|
|
||||||
"""
|
|
||||||
from collections import MutableMapping
|
|
||||||
try:
|
|
||||||
import cPickle as pickle
|
|
||||||
except ImportError:
|
|
||||||
import pickle
|
|
||||||
|
|
||||||
from pymongo import Connection
|
|
||||||
|
|
||||||
|
|
||||||
class MongoDict(MutableMapping):
    """ MongoDict - a dictionary-like interface for ``mongo`` database
    """
    def __init__(self, db_name,
                 collection_name='mongo_dict_data', connection=None):
        """
        :param db_name: database name (be careful with production databases)
        :param collection_name: collection name (default: mongo_dict_data)
        :param connection: ``pymongo.Connection`` instance. If it's ``None``
                           (default) new connection with default options will
                           be created
        """
        self.connection = Connection() if connection is None else connection
        self.db = self.connection[db_name]
        self.collection = self.db[collection_name]

    def __getitem__(self, key):
        # Each entry is one document: {'_id': key, 'data': value}.
        document = self.collection.find_one({'_id': key})
        if document is not None:
            return document['data']
        raise KeyError

    def __setitem__(self, key, item):
        document = {'_id': key, 'data': item}
        self.collection.save(document)

    def __delitem__(self, key):
        spec = {'_id': key}
        if not self.collection.find_one(spec, fields=['_id']):
            raise KeyError
        self.collection.remove(spec)

    def __len__(self):
        return self.collection.count()

    def __iter__(self):
        # Only the ids are requested; the values are not needed here.
        for document in self.collection.find(fields=['_id']):
            yield document['_id']

    def clear(self):
        self.collection.drop()

    def __str__(self):
        snapshot = dict(self.items())
        return str(snapshot)
|
|
||||||
|
|
||||||
|
|
||||||
class MongoPickleDict(MongoDict):
    """ Same as :class:`MongoDict`, but pickles values before saving
    """
    def __setitem__(self, key, item):
        pickled = pickle.dumps(item)
        super(MongoPickleDict, self).__setitem__(key, pickled)

    def __getitem__(self, key):
        # NOTE(review): pickle.loads runs on whatever the collection
        # returns, so the database has to be trusted.
        stored = super(MongoPickleDict, self).__getitem__(key)
        return pickle.loads(bytes(stored))
|
|
@ -1,68 +0,0 @@
|
|||||||
#!/usr/bin/env python
|
|
||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
requests_cache.backends.redisdict
|
|
||||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
Dictionary-like objects for saving large data sets to ``redis`` key-store
|
|
||||||
"""
|
|
||||||
from collections import MutableMapping
|
|
||||||
try:
|
|
||||||
import cPickle as pickle
|
|
||||||
except ImportError:
|
|
||||||
import pickle
|
|
||||||
from redis import StrictRedis as Redis
|
|
||||||
|
|
||||||
|
|
||||||
class RedisDict(MutableMapping):
    """ RedisDict - a dictionary-like interface for ``redis`` key-stores
    """
    def __init__(self, namespace, collection_name='redis_dict_data',
                 connection=None):
        """
        The actual key name on the redis server will be
        ``namespace``:``collection_name``

        In order to deal with how redis stores data/keys,
        everything, i.e. keys and data, must be pickled.

        :param namespace: namespace to use
        :param collection_name: name of the hash map stored in redis
                                (default: redis_dict_data)
        :param connection: ``redis.StrictRedis`` instance.
                           If it's ``None`` (default), a new connection with
                           default options will be created

        """
        self.connection = Redis() if connection is None else connection
        self._self_key = ':'.join((namespace, collection_name))

    def __getitem__(self, key):
        raw = self.connection.hget(self._self_key, pickle.dumps(key))
        if raw is not None:
            return pickle.loads(bytes(raw))
        raise KeyError

    def __setitem__(self, key, item):
        field = pickle.dumps(key)
        payload = pickle.dumps(item)
        self.connection.hset(self._self_key, field, payload)

    def __delitem__(self, key):
        # A falsy hdel result is treated as "no such key".
        removed = self.connection.hdel(self._self_key, pickle.dumps(key))
        if not removed:
            raise KeyError

    def __len__(self):
        return self.connection.hlen(self._self_key)

    def __iter__(self):
        # Hash fields are pickled keys; unpickle them on the way out.
        for field in self.connection.hkeys(self._self_key):
            yield pickle.loads(bytes(field))

    def clear(self):
        self.connection.delete(self._self_key)

    def __str__(self):
        snapshot = dict(self.items())
        return str(snapshot)
|
|
@ -1,103 +0,0 @@
|
|||||||
# -*- coding: utf-8 -*-
|
|
||||||
# taken from requests library: https://github.com/kennethreitz/requests
|
|
||||||
"""
|
|
||||||
pythoncompat
|
|
||||||
"""
|
|
||||||
|
|
||||||
|
|
||||||
import sys
|
|
||||||
|
|
||||||
# -------
|
|
||||||
# Pythons
|
|
||||||
# -------
|
|
||||||
|
|
||||||
# Syntax sugar.
|
|
||||||
# (major, minor, ...) of the running interpreter.
_ver = sys.version_info

#: Python 2.x?
is_py2 = _ver[0] == 2

#: Python 3.x?
is_py3 = _ver[0] == 3

#: Python 3.0.x
is_py30 = _ver[:2] == (3, 0)

#: Python 3.1.x
is_py31 = _ver[:2] == (3, 1)

#: Python 3.2.x
is_py32 = _ver[:2] == (3, 2)

#: Python 3.3.x
is_py33 = _ver[:2] == (3, 3)

#: Python 3.4.x
is_py34 = _ver[:2] == (3, 4)

#: Python 2.7.x
is_py27 = _ver[:2] == (2, 7)

#: Python 2.6.x
is_py26 = _ver[:2] == (2, 6)

#: Python 2.5.x
is_py25 = _ver[:2] == (2, 5)

#: Python 2.4.x
is_py24 = _ver[:2] == (2, 4)  # I'm assuming this is not by choice.
|
|
||||||
|
|
||||||
|
|
||||||
# ---------
|
|
||||||
# Platforms
|
|
||||||
# ---------
|
|
||||||
|
|
||||||
|
|
||||||
# Syntax sugar.
|
|
||||||
# Lower-cased interpreter version banner; implementations are detected by
# looking for their name in it.
_ver = sys.version.lower()

is_pypy = ('pypy' in _ver)
is_jython = ('jython' in _ver)
is_ironpython = ('iron' in _ver)

# Assume CPython, if nothing else.
is_cpython = not any((is_pypy, is_jython, is_ironpython))

# Windows-based system.
is_windows = 'win32' in str(sys.platform).lower()

# Standard Linux 2+ system.
is_linux = ('linux' in str(sys.platform).lower())
is_osx = ('darwin' in str(sys.platform).lower())
is_hpux = ('hpux' in str(sys.platform).lower())   # Complete guess.
# Solaris reports itself as 'sunos5'; the previous 'solar==' test could
# never match any platform string.
is_solaris = ('sunos' in str(sys.platform).lower() or
              'solaris' in str(sys.platform).lower())
|
|
||||||
|
|
||||||
|
|
||||||
# ---------
|
|
||||||
# Specifics
|
|
||||||
# ---------
|
|
||||||
|
|
||||||
|
|
||||||
if is_py2:
    # Python 2: the URL, cookie and string-buffer helpers live in several
    # separate legacy modules.
    import cookielib
    from StringIO import StringIO
    from urllib import quote, unquote, urlencode
    from urllib2 import parse_http_list
    from urlparse import urlparse, urlunparse, urljoin, urlsplit

    # Re-export the text/binary names with Python 3 meaning: ``bytes`` is the
    # native byte string and ``str`` is the unicode text type.  The order of
    # these two assignments matters.
    bytes = str
    str = unicode
    basestring = basestring

elif is_py3:
    # Python 3: same public names, imported from their relocated homes.
    from io import StringIO
    from http import cookiejar as cookielib
    from http.cookies import SimpleCookie
    from urllib.parse import (urlparse, urlunparse, urljoin, urlsplit,
                              urlencode, quote, unquote)
    from urllib.request import parse_http_list

    # Python 3 has no ``basestring``; emulate it with a tuple that is usable
    # as the second argument of ``isinstance``.
    str = str
    bytes = bytes
    basestring = (str, bytes)
|
|
||||||
|
|
@ -1,227 +0,0 @@
|
|||||||
#!/usr/bin/env python
|
|
||||||
# -*- coding: utf-8 -*-
|
|
||||||
"""
|
|
||||||
requests_cache.core
|
|
||||||
~~~~~~~~~~~~~~~~~~~
|
|
||||||
|
|
||||||
Core functions for configuring cache and monkey patching ``requests``
|
|
||||||
"""
|
|
||||||
from contextlib import contextmanager
|
|
||||||
from datetime import datetime, timedelta
|
|
||||||
|
|
||||||
import requests
|
|
||||||
from requests import Session as OriginalSession
|
|
||||||
from requests.hooks import dispatch_hook
|
|
||||||
|
|
||||||
from requests_cache import backends
|
|
||||||
from requests_cache.compat import str, basestring
|
|
||||||
|
|
||||||
# Replace ``dispatch_hook`` with a pass-through on old Requests releases.
try:
    ver = tuple(int(part) for part in requests.__version__.split("."))
except ValueError:
    # A version component is not a plain integer; keep the real
    # ``dispatch_hook`` imported above.
    pass
else:
    # We don't need to dispatch hook in Requests <= 1.1.0
    if ver < (1, 2, 0):
        def dispatch_hook(key, hooks, hook_data, *a, **kw):
            """No-op stand-in: hand back ``hook_data`` untouched."""
            return hook_data
    del ver
|
|
||||||
|
|
||||||
|
|
||||||
class CachedSession(OriginalSession):
    """ Requests ``Sessions`` with caching support.
    """

    def __init__(self, cache_name='cache', backend=None, expire_after=None,
                 allowable_codes=(200,), allowable_methods=('GET',),
                 **backend_options):
        """
        :param cache_name: for ``sqlite`` backend: cache file will start with this prefix,
                           e.g ``cache.sqlite``

                           for ``mongodb``: it's used as database name

                           for ``redis``: it's used as the namespace. This means all keys
                           are prefixed with ``'cache_name:'``
        :param backend: cache backend name e.g ``'sqlite'``, ``'mongodb'``, ``'redis'``, ``'memory'``.
                        (see :ref:`persistence`). Or instance of backend implementation.
                        Default value is ``None``, which means use ``'sqlite'`` if available,
                        otherwise fallback to ``'memory'``.
        :param expire_after: number of seconds after cache will be expired
                             or `None` (default) to ignore expiration
        :type expire_after: float
        :param allowable_codes: limit caching only for response with this codes (default: 200)
        :type allowable_codes: tuple
        :param allowable_methods: cache only requests of this methods (default: 'GET')
        :type allowable_methods: tuple
        :kwarg backend_options: options for chosen backend. See corresponding
                                :ref:`sqlite <backends_sqlite>`, :ref:`mongo <backends_mongo>`
                                and :ref:`redis <backends_redis>` backends API documentation
        """
        # A name (or ``None``) is resolved through the backend factory;
        # anything else is taken to be a ready-made backend instance.
        if backend is None or isinstance(backend, basestring):
            self.cache = backends.create_backend(backend, cache_name,
                                                 backend_options)
        else:
            self.cache = backend

        self._cache_expire_after = expire_after
        self._cache_allowable_codes = allowable_codes
        self._cache_allowable_methods = allowable_methods
        self._is_cache_disabled = False
        super(CachedSession, self).__init__()

    def send(self, request, **kwargs):
        """ Sends prepared ``request``, serving it from cache when possible.

        The returned response carries a ``from_cache`` attribute: ``True``
        when it was read from the cache, ``False`` when it came from the
        parent session's ``send``.

        :param request: prepared request to send
        :kwarg kwargs: passed through to the parent ``send`` and to the
                       ``'response'`` hook dispatch for cached responses
        """
        # Bypass the cache entirely when it is disabled or the method is
        # not one we cache.
        if (self._is_cache_disabled
                or request.method not in self._cache_allowable_methods):
            response = super(CachedSession, self).send(request, **kwargs)
            response.from_cache = False
            return response

        cache_key = self.cache.create_key(request)

        def send_request_and_cache_response():
            # Perform the real request; store it only for allowed status codes.
            response = super(CachedSession, self).send(request, **kwargs)
            if response.status_code in self._cache_allowable_codes:
                self.cache.save_response(cache_key, response)
            response.from_cache = False
            return response

        response, timestamp = self.cache.get_response_and_time(cache_key)
        if response is None:
            return send_request_and_cache_response()

        if self._cache_expire_after is not None:
            difference = datetime.utcnow() - timestamp
            if difference > timedelta(seconds=self._cache_expire_after):
                # Entry is stale: drop it and fetch a fresh response.
                self.cache.delete(cache_key)
                return send_request_and_cache_response()

        # dispatch hook here, because we've removed it before pickling
        response.from_cache = True
        response = dispatch_hook('response', request.hooks, response, **kwargs)
        return response

    def request(self, method, url, params=None, data=None, headers=None,
                cookies=None, files=None, auth=None, timeout=None,
                allow_redirects=True, proxies=None, hooks=None, stream=None,
                verify=None, cert=None):
        """ Performs the request through the parent session and, unless the
        cache is disabled, maps the cache key of every response in
        ``response.history`` to the key of the final response.

        All arguments are forwarded unchanged (positionally) to the parent
        ``request`` method.
        """
        response = super(CachedSession, self).request(method, url, params, data,
                                                      headers, cookies, files,
                                                      auth, timeout,
                                                      allow_redirects, proxies,
                                                      hooks, stream, verify, cert)
        if self._is_cache_disabled:
            return response

        main_key = self.cache.create_key(response.request)
        for r in response.history:
            self.cache.add_key_mapping(
                self.cache.create_key(r.request), main_key
            )
        return response

    @contextmanager
    def cache_disabled(self):
        """
        Context manager for temporary disabling cache
        ::

            >>> s = CachedSession()
            >>> with s.cache_disabled():
            ...     s.get('http://httpbin.org/ip')
        """
        # Remember the state on entry so that nested ``cache_disabled()``
        # blocks do not re-enable the cache while an outer block is active.
        previous = self._is_cache_disabled
        self._is_cache_disabled = True
        try:
            yield
        finally:
            self._is_cache_disabled = previous
|
|
||||||
|
|
||||||
|
|
||||||
def install_cache(cache_name='cache', backend=None, expire_after=None,
                  allowable_codes=(200,), allowable_methods=('GET',),
                  session_factory=CachedSession, **backend_options):
    """
    Installs cache for all ``Requests`` requests by monkey-patching ``Session``

    Parameters are the same as in :class:`CachedSession`. Additional parameters:

    :param session_factory: Session factory. It should inherit :class:`CachedSession` (default)
    """
    # Resolve a backend *name* once, up front, so every session produced by
    # the factory shares one backend object.  A backend instance is passed
    # through as-is (``CachedSession`` accepts instances) rather than being
    # handed to ``create_backend`` as if it were a name.
    if backend and isinstance(backend, basestring):
        backend = backends.create_backend(backend, cache_name, backend_options)
    _patch_session_factory(
        lambda: session_factory(cache_name=cache_name,
                                backend=backend,
                                expire_after=expire_after,
                                allowable_codes=allowable_codes,
                                allowable_methods=allowable_methods,
                                **backend_options)
    )


# backward compatibility
configure = install_cache
|
|
||||||
|
|
||||||
|
|
||||||
def uninstall_cache():
    """ Puts the original ``requests`` session class back in place, which
    turns the globally installed cache off
    """
    _patch_session_factory(session_factory=OriginalSession)
|
|
||||||
|
|
||||||
|
|
||||||
@contextmanager
def disabled():
    """
    Context manager that switches the globally installed cache off for the
    duration of the ``with`` block and reinstates the previous session
    factory afterwards

    .. warning:: not thread-safe

    ::

        >>> with requests_cache.disabled():
        ...     requests.get('http://httpbin.org/ip')
        ...     requests.get('http://httpbin.org/get')

    """
    # Capture whatever factory is active now so it can be put back on exit.
    saved_factory = requests.Session
    uninstall_cache()
    try:
        yield
    finally:
        _patch_session_factory(saved_factory)
|
|
||||||
|
|
||||||
|
|
||||||
@contextmanager
def enabled(*args, **kwargs):
    """
    Context manager that installs the global cache on entry and uninstalls
    it again on exit.

    Takes exactly the arguments of :func:`install_cache`

    .. warning:: not thread-safe

    ::

        >>> with requests_cache.enabled('cache_db'):
        ...     requests.get('http://httpbin.org/get')

    """
    install_cache(*args, **kwargs)
    try:
        yield
    finally:
        # Always uninstall on exit, even when the body raised.
        uninstall_cache()
|
|
||||||
|
|
||||||
|
|
||||||
def get_cache():
    """ Creates a session from the currently installed ``requests.Session``
    factory and returns its ``cache`` attribute
    """
    session = requests.Session()
    return session.cache
|
|
||||||
|
|
||||||
|
|
||||||
def clear():
    """ Empties the globally installed cache by calling ``clear()`` on the
    object returned by :func:`get_cache`
    """
    installed_cache = get_cache()
    installed_cache.clear()
|
|
||||||
|
|
||||||
|
|
||||||
def _patch_session_factory(session_factory=CachedSession):
    """ Rebinds both ``requests.Session`` and ``requests.sessions.Session``
    to ``session_factory``
    """
    requests.Session = session_factory
    requests.sessions.Session = session_factory
|
|
@ -37,15 +37,13 @@ except ImportError:
|
|||||||
gzip = None
|
gzip = None
|
||||||
|
|
||||||
from lib import requests
|
from lib import requests
|
||||||
from lib import requests_cache
|
from lib import cachecontrol
|
||||||
|
from lib.cachecontrol import caches
|
||||||
|
|
||||||
from tvdb_ui import BaseUI, ConsoleUI
|
from tvdb_ui import BaseUI, ConsoleUI
|
||||||
from tvdb_exceptions import (tvdb_error, tvdb_userabort, tvdb_shownotfound,
|
from tvdb_exceptions import (tvdb_error, tvdb_userabort, tvdb_shownotfound,
|
||||||
tvdb_seasonnotfound, tvdb_episodenotfound, tvdb_attributenotfound)
|
tvdb_seasonnotfound, tvdb_episodenotfound, tvdb_attributenotfound)
|
||||||
|
|
||||||
# Cached Session Handler
|
|
||||||
from lib.httpcache import CachingHTTPAdapter
|
|
||||||
|
|
||||||
def log():
|
def log():
|
||||||
return logging.getLogger("tvdb_api")
|
return logging.getLogger("tvdb_api")
|
||||||
|
|
||||||
@ -429,12 +427,14 @@ class Tvdb:
|
|||||||
|
|
||||||
if cache is True:
|
if cache is True:
|
||||||
self.config['cache_enabled'] = True
|
self.config['cache_enabled'] = True
|
||||||
requests_cache.install_cache(self._getTempDir())
|
self.sess = cachecontrol.CacheControl(requests.Session(),
|
||||||
|
cache=caches.FileCache(self._getTempDir()), cache_all=True)
|
||||||
elif cache is False:
|
elif cache is False:
|
||||||
self.config['cache_enabled'] = False
|
self.config['cache_enabled'] = False
|
||||||
elif isinstance(cache, basestring):
|
elif isinstance(cache, basestring):
|
||||||
self.config['cache_enabled'] = True
|
self.config['cache_enabled'] = True
|
||||||
requests_cache.install_cache(cache)
|
self.sess = cachecontrol.CacheControl(requests.Session(),
|
||||||
|
cache=caches.FileCache(cache), cache_all=True)
|
||||||
else:
|
else:
|
||||||
raise ValueError("Invalid value for Cache %r (type was %s)" % (cache, type(cache)))
|
raise ValueError("Invalid value for Cache %r (type was %s)" % (cache, type(cache)))
|
||||||
|
|
||||||
@ -537,10 +537,9 @@ class Tvdb:
|
|||||||
|
|
||||||
# get response from TVDB
|
# get response from TVDB
|
||||||
if self.config['cache_enabled']:
|
if self.config['cache_enabled']:
|
||||||
resp = requests.get(url, params=params)
|
resp = self.sess.get(url, params=sorted(params))
|
||||||
else:
|
else:
|
||||||
with requests_cache.disabled():
|
resp = requests.get(url, params=params)
|
||||||
resp = requests.get(url, params=params)
|
|
||||||
|
|
||||||
except requests.HTTPError, e:
|
except requests.HTTPError, e:
|
||||||
raise tvdb_error("HTTP error " + str(e.errno) + " while loading URL " + str(url))
|
raise tvdb_error("HTTP error " + str(e.errno) + " while loading URL " + str(url))
|
||||||
|
@ -32,15 +32,13 @@ except ImportError:
|
|||||||
from lib.dateutil.parser import parse
|
from lib.dateutil.parser import parse
|
||||||
|
|
||||||
from lib import requests
|
from lib import requests
|
||||||
from lib import requests_cache
|
from lib import cachecontrol
|
||||||
|
from lib.cachecontrol import caches
|
||||||
|
|
||||||
from tvrage_ui import BaseUI
|
from tvrage_ui import BaseUI
|
||||||
from tvrage_exceptions import (tvrage_error, tvrage_userabort, tvrage_shownotfound,
|
from tvrage_exceptions import (tvrage_error, tvrage_userabort, tvrage_shownotfound,
|
||||||
tvrage_seasonnotfound, tvrage_episodenotfound, tvrage_attributenotfound)
|
tvrage_seasonnotfound, tvrage_episodenotfound, tvrage_attributenotfound)
|
||||||
|
|
||||||
# Cached Session Handler
|
|
||||||
from lib.httpcache import CachingHTTPAdapter
|
|
||||||
|
|
||||||
def log():
|
def log():
|
||||||
return logging.getLogger("tvrage_api")
|
return logging.getLogger("tvrage_api")
|
||||||
|
|
||||||
@ -272,12 +270,14 @@ class TVRage:
|
|||||||
|
|
||||||
if cache is True:
|
if cache is True:
|
||||||
self.config['cache_enabled'] = True
|
self.config['cache_enabled'] = True
|
||||||
requests_cache.install_cache(self._getTempDir())
|
self.sess = cachecontrol.CacheControl(requests.Session(),
|
||||||
|
cache=caches.FileCache(self._getTempDir()), cache_all=True)
|
||||||
elif cache is False:
|
elif cache is False:
|
||||||
self.config['cache_enabled'] = False
|
self.config['cache_enabled'] = False
|
||||||
elif isinstance(cache, basestring):
|
elif isinstance(cache, basestring):
|
||||||
self.config['cache_enabled'] = True
|
self.config['cache_enabled'] = True
|
||||||
requests_cache.install_cache(cache)
|
self.sess = cachecontrol.CacheControl(requests.Session(),
|
||||||
|
cache=caches.FileCache(cache), cache_all=True)
|
||||||
else:
|
else:
|
||||||
raise ValueError("Invalid value for Cache %r (type was %s)" % (cache, type(cache)))
|
raise ValueError("Invalid value for Cache %r (type was %s)" % (cache, type(cache)))
|
||||||
|
|
||||||
@ -370,10 +370,9 @@ class TVRage:
|
|||||||
|
|
||||||
# get response from TVRage
|
# get response from TVRage
|
||||||
if self.config['cache_enabled']:
|
if self.config['cache_enabled']:
|
||||||
resp = requests.get(url, params=params)
|
resp = self.sess.get(url, params=params)
|
||||||
else:
|
else:
|
||||||
with requests_cache.disabled():
|
resp = requests.get(url, params=params)
|
||||||
resp = requests.get(url, params=params)
|
|
||||||
|
|
||||||
except requests.HTTPError, e:
|
except requests.HTTPError, e:
|
||||||
raise tvrage_error("HTTP error " + str(e.errno) + " while loading URL " + str(url))
|
raise tvrage_error("HTTP error " + str(e.errno) + " while loading URL " + str(url))
|
||||||
|
Loading…
Reference in New Issue
Block a user