420 lines
14 KiB
Python
Raw Normal View History

2012-10-22 14:34:12 -05:00
"""
A simple JSON REST request abstraction layer that is used by the
2017-01-05 10:37:41 -06:00
``dropbox.client`` and ``dropbox.session`` modules. You shouldn't need to use this.
2012-10-22 14:34:12 -05:00
"""
2017-01-05 10:37:41 -06:00
import io
2012-10-22 14:34:12 -05:00
import socket
import ssl
import sys
import urllib
2017-01-05 10:37:41 -06:00
import pkg_resources
2012-10-22 14:34:12 -05:00
try:
import json
except ImportError:
import simplejson as json
2017-01-05 10:37:41 -06:00
try:
import requests.packages.urllib3 as urllib3
except ImportError:
raise ImportError('Dropbox python client requires urllib3.')
SDK_VERSION = "2.2.0"
2012-10-22 14:34:12 -05:00
TRUSTED_CERT_FILE = pkg_resources.resource_filename(__name__, 'trusted-certs.crt')
2017-01-05 10:37:41 -06:00
class RESTResponse(io.IOBase):
2012-10-22 14:34:12 -05:00
"""
2017-01-05 10:37:41 -06:00
Responses to requests can come in the form of ``RESTResponse``. These are
thin wrappers around the socket file descriptor.
:meth:`read()` and :meth:`close()` are implemented.
It is important to call :meth:`close()` to return the connection
back to the connection pool to be reused. If a connection
is not closed by the caller it may leak memory. The object makes a
best-effort attempt upon destruction to call :meth:`close()`,
but it's still best to explicitly call :meth:`close()`.
2012-10-22 14:34:12 -05:00
"""
2017-01-05 10:37:41 -06:00
def __init__(self, resp):
# arg: A urllib3.HTTPResponse object
self.urllib3_response = resp
self.status = resp.status
self.version = resp.version
self.reason = resp.reason
self.strict = resp.strict
self.is_closed = False
def __del__(self):
# Attempt to close when ref-count goes to zero.
self.close()
def __exit__(self, typ, value, traceback):
# Allow this to be used in "with" blocks.
self.close()
# -----------------
# Important methods
# -----------------
def read(self, amt=None):
"""
Read data off the underlying socket.
Parameters
amt
Amount of data to read. Defaults to ``None``, indicating to read
everything.
Returns
Data off the socket. If ``amt`` is not ``None``, at most ``amt`` bytes are returned.
An empty string when the socket has no data.
Raises
``ValueError``
If the ``RESTResponse`` has already been closed.
"""
if self.is_closed:
raise ValueError('Response already closed')
return self.urllib3_response.read(amt)
BLOCKSIZE = 4 * 1024 * 1024 # 4MB at a time just because
def close(self):
"""Closes the underlying socket."""
# Double closing is harmless
if self.is_closed:
return
# Read any remaining crap off the socket before releasing the
# connection. Buffer it just in case it's huge
while self.read(RESTResponse.BLOCKSIZE):
pass
# Mark as closed and release the connection (exactly once)
self.is_closed = True
self.urllib3_response.release_conn()
@property
def closed(self):
return self.is_closed
# ---------------------------------
# Backwards compat for HTTPResponse
# ---------------------------------
def getheaders(self):
"""Returns a dictionary of the response headers."""
return self.urllib3_response.getheaders()
def getheader(self, name, default=None):
"""Returns a given response header."""
return self.urllib3_response.getheader(name, default)
# Some compat functions showed up recently in urllib3
try:
urllib3.HTTPResponse.flush
urllib3.HTTPResponse.fileno
def fileno(self):
return self.urllib3_response.fileno()
def flush(self):
return self.urllib3_response.flush()
except AttributeError:
pass
2012-10-22 14:34:12 -05:00
def create_connection(address):
host, port = address
err = None
for res in socket.getaddrinfo(host, port, 0, socket.SOCK_STREAM):
af, socktype, proto, canonname, sa = res
sock = None
try:
sock = socket.socket(af, socktype, proto)
sock.connect(sa)
return sock
2017-01-05 10:37:41 -06:00
except socket.error as e:
err = e
2012-10-22 14:34:12 -05:00
if sock is not None:
sock.close()
if err is not None:
raise err
else:
raise socket.error("getaddrinfo returns an empty list")
def json_loadb(data):
if sys.version_info >= (3,):
data = data.decode('utf8')
return json.loads(data)
2017-01-05 10:37:41 -06:00
2012-10-22 14:34:12 -05:00
class RESTClientObject(object):
2017-01-05 10:37:41 -06:00
def __init__(self, max_reusable_connections=8, mock_urlopen=None):
"""
Parameters
max_reusable_connections
max connections to keep alive in the pool
mock_urlopen
an optional alternate urlopen function for testing
This class uses ``urllib3`` to maintain a pool of connections. We attempt
to grab an existing idle connection from the pool, otherwise we spin
up a new connection. Once a connection is closed, it is reinserted
into the pool (unless the pool is full).
SSL settings:
- Certificates validated using Dropbox-approved trusted root certs
- TLS v1.0 (newer TLS versions are not supported by urllib3)
- Default ciphersuites. Choosing ciphersuites is not supported by urllib3
- Hostname verification is provided by urllib3
"""
self.mock_urlopen = mock_urlopen
self.pool_manager = urllib3.PoolManager(
num_pools=4, # only a handful of hosts. api.dropbox.com, api-content.dropbox.com
maxsize=max_reusable_connections,
block=False,
timeout=60.0, # long enough so datastores await doesn't get interrupted
cert_reqs=ssl.CERT_REQUIRED,
ca_certs=TRUSTED_CERT_FILE,
ssl_version=ssl.PROTOCOL_TLSv1,
)
2012-10-22 14:34:12 -05:00
def request(self, method, url, post_params=None, body=None, headers=None, raw_response=False):
2017-01-05 10:37:41 -06:00
"""Performs a REST request. See :meth:`RESTClient.request()` for detailed description."""
2012-10-22 14:34:12 -05:00
post_params = post_params or {}
headers = headers or {}
headers['User-Agent'] = 'OfficialDropboxPythonSDK/' + SDK_VERSION
if post_params:
if body:
raise ValueError("body parameter cannot be used with post_params parameter")
2017-01-05 10:37:41 -06:00
body = params_to_urlencoded(post_params)
2012-10-22 14:34:12 -05:00
headers["Content-type"] = "application/x-www-form-urlencoded"
2017-01-05 10:37:41 -06:00
# Handle StringIO instances, because urllib3 doesn't.
if hasattr(body, 'getvalue'):
body = str(body.getvalue())
headers["Content-Length"] = len(body)
2012-10-22 14:34:12 -05:00
2017-01-05 10:37:41 -06:00
# Reject any headers containing newlines; the error from the server isn't pretty.
for key, value in headers.items():
if isinstance(value, basestring) and '\n' in value:
raise ValueError("headers should not contain newlines (%s: %s)" %
(key, value))
2012-10-22 14:34:12 -05:00
try:
2017-01-05 10:37:41 -06:00
# Grab a connection from the pool to make the request.
# We return it to the pool when caller close() the response
urlopen = self.mock_urlopen if self.mock_urlopen else self.pool_manager.urlopen
r = urlopen(
method=method,
url=url,
body=body,
headers=headers,
preload_content=False
)
r = RESTResponse(r) # wrap up the urllib3 response before proceeding
except socket.error as e:
raise RESTSocketError(url, e)
except urllib3.exceptions.SSLError as e:
raise RESTSocketError(url, "SSL certificate error: %s" % e)
if r.status not in (200, 206):
raise ErrorResponse(r, r.read())
return self.process_response(r, raw_response)
def process_response(self, r, raw_response):
2012-10-22 14:34:12 -05:00
if raw_response:
return r
else:
2017-01-05 10:37:41 -06:00
s = r.read()
2012-10-22 14:34:12 -05:00
try:
2017-01-05 10:37:41 -06:00
resp = json_loadb(s)
2012-10-22 14:34:12 -05:00
except ValueError:
2017-01-05 10:37:41 -06:00
raise ErrorResponse(r, s)
r.close()
2012-10-22 14:34:12 -05:00
return resp
def GET(self, url, headers=None, raw_response=False):
assert type(raw_response) == bool
return self.request("GET", url, headers=headers, raw_response=raw_response)
def POST(self, url, params=None, headers=None, raw_response=False):
assert type(raw_response) == bool
if params is None:
params = {}
return self.request("POST", url,
post_params=params, headers=headers, raw_response=raw_response)
def PUT(self, url, body, headers=None, raw_response=False):
assert type(raw_response) == bool
return self.request("PUT", url, body=body, headers=headers, raw_response=raw_response)
2017-01-05 10:37:41 -06:00
class RESTClient(object):
2012-10-22 14:34:12 -05:00
"""
2017-01-05 10:37:41 -06:00
A class with all static methods to perform JSON REST requests that is used internally
2012-10-22 14:34:12 -05:00
by the Dropbox Client API. It provides just enough gear to make requests
and get responses as JSON data (when applicable). All requests happen over SSL.
"""
2017-01-05 10:37:41 -06:00
IMPL = RESTClientObject()
2012-10-22 14:34:12 -05:00
@classmethod
def request(cls, *n, **kw):
"""Perform a REST request and parse the response.
2017-01-05 10:37:41 -06:00
Parameters
method
An HTTP method (e.g. ``'GET'`` or ``'POST'``).
url
The URL to make a request to.
post_params
A dictionary of parameters to put in the body of the request.
2012-10-22 14:34:12 -05:00
This option may not be used if the body parameter is given.
2017-01-05 10:37:41 -06:00
body
The body of the request. Typically, this value will be a string.
It may also be a file-like object. The body
2012-10-22 14:34:12 -05:00
parameter may not be used with the post_params parameter.
2017-01-05 10:37:41 -06:00
headers
A dictionary of headers to send with the request.
raw_response
Whether to return a :class:`RESTResponse` object. Default ``False``.
2012-10-22 14:34:12 -05:00
It's best enabled for requests that return large amounts of data that you
2017-01-05 10:37:41 -06:00
would want to ``.read()`` incrementally rather than loading into memory. Also
2012-10-22 14:34:12 -05:00
use this for calls where you need to read metadata like status or headers,
or if the body is not JSON.
2017-01-05 10:37:41 -06:00
Returns
The JSON-decoded data from the server, unless ``raw_response`` is
set, in which case a :class:`RESTResponse` object is returned instead.
2012-10-22 14:34:12 -05:00
2017-01-05 10:37:41 -06:00
Raises
:class:`ErrorResponse`
The returned HTTP status is not 200, or the body was
2012-10-22 14:34:12 -05:00
not parsed from JSON successfully.
2017-01-05 10:37:41 -06:00
:class:`RESTSocketError`
A ``socket.error`` was raised while contacting Dropbox.
2012-10-22 14:34:12 -05:00
"""
return cls.IMPL.request(*n, **kw)
@classmethod
def GET(cls, *n, **kw):
2017-01-05 10:37:41 -06:00
"""Perform a GET request using :meth:`RESTClient.request()`."""
2012-10-22 14:34:12 -05:00
return cls.IMPL.GET(*n, **kw)
@classmethod
def POST(cls, *n, **kw):
2017-01-05 10:37:41 -06:00
"""Perform a POST request using :meth:`RESTClient.request()`."""
2012-10-22 14:34:12 -05:00
return cls.IMPL.POST(*n, **kw)
@classmethod
def PUT(cls, *n, **kw):
2017-01-05 10:37:41 -06:00
"""Perform a PUT request using :meth:`RESTClient.request()`."""
2012-10-22 14:34:12 -05:00
return cls.IMPL.PUT(*n, **kw)
2017-01-05 10:37:41 -06:00
2012-10-22 14:34:12 -05:00
class RESTSocketError(socket.error):
2017-01-05 10:37:41 -06:00
"""A light wrapper for ``socket.error`` that adds some more information."""
2012-10-22 14:34:12 -05:00
def __init__(self, host, e):
msg = "Error connecting to \"%s\": %s" % (host, str(e))
socket.error.__init__(self, msg)
2017-01-05 10:37:41 -06:00
# Dummy class for docstrings, see doco.py.
class _ErrorResponse__doc__(Exception):
"""Exception raised when :class:`DropboxClient` exeriences a problem.
For example, this is raised when the server returns an unexpected
non-200 HTTP response.
"""
_status__doc__ = "HTTP response status (an int)."
_reason__doc__ = "HTTP response reason (a string)."
_headers__doc__ = "HTTP response headers (a list of (header, value) tuples)."
_body__doc__ = "HTTP response body (string or JSON dict)."
_error_msg__doc__ = "Error message for developer (optional)."
_user_error_msg__doc__ = "Error message for end user (optional)."
2012-10-22 14:34:12 -05:00
class ErrorResponse(Exception):
"""
2017-01-05 10:37:41 -06:00
Raised by :meth:`RESTClient.request()` for requests that:
2012-10-22 14:34:12 -05:00
2017-01-05 10:37:41 -06:00
- Return a non-200 HTTP response, or
- Have a non-JSON response body, or
- Have a malformed/missing header in the response.
Most errors that Dropbox returns will have an error field that is unpacked and
2012-10-22 14:34:12 -05:00
placed on the ErrorResponse exception. In some situations, a user_error field
will also come back. Messages under user_error are worth showing to an end-user
of your app, while other errors are likely only useful for you as the developer.
"""
2017-01-05 10:37:41 -06:00
def __init__(self, http_resp, body):
"""
Parameters
http_resp
The :class:`RESTResponse` which errored
body
Body of the :class:`RESTResponse`.
The reason we can't simply call ``http_resp.read()`` to
get the body, is that ``read()`` is not idempotent.
Since it can't be called more than once,
we have to pass the string body in separately
"""
2012-10-22 14:34:12 -05:00
self.status = http_resp.status
self.reason = http_resp.reason
2017-01-05 10:37:41 -06:00
self.body = body
2012-10-22 14:34:12 -05:00
self.headers = http_resp.getheaders()
2017-01-05 10:37:41 -06:00
http_resp.close() # won't need this connection anymore
2012-10-22 14:34:12 -05:00
try:
self.body = json_loadb(self.body)
self.error_msg = self.body.get('error')
self.user_error_msg = self.body.get('user_error')
except ValueError:
self.error_msg = None
self.user_error_msg = None
def __str__(self):
if self.user_error_msg and self.user_error_msg != self.error_msg:
# one is translated and the other is English
2017-01-05 10:37:41 -06:00
msg = "%r (%r)" % (self.user_error_msg, self.error_msg)
2012-10-22 14:34:12 -05:00
elif self.error_msg:
2017-01-05 10:37:41 -06:00
msg = repr(self.error_msg)
2012-10-22 14:34:12 -05:00
elif not self.body:
2017-01-05 10:37:41 -06:00
msg = repr(self.reason)
2012-10-22 14:34:12 -05:00
else:
msg = "Error parsing response body or headers: " +\
2017-01-05 10:37:41 -06:00
"Body - %.100r Headers - %r" % (self.body, self.headers)
return "[%d] %s" % (self.status, msg)
2012-10-22 14:34:12 -05:00
2017-01-05 10:37:41 -06:00
def params_to_urlencoded(params):
"""
Returns a application/x-www-form-urlencoded 'str' representing the key/value pairs in 'params'.
Keys are values are str()'d before calling urllib.urlencode, with the exception of unicode
objects which are utf8-encoded.
"""
def encode(o):
if isinstance(o, unicode):
return o.encode('utf8')
else:
return str(o)
2017-01-23 09:57:01 -06:00
utf8_params={}
for k, v in params.iteritems():
utf8_params[encode(k)]= encode(v)
2017-01-05 10:37:41 -06:00
return urllib.urlencode(utf8_params)