Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

#15: Add storage.batch.Batch #654

Merged
merged 9 commits into from
Feb 26, 2015
185 changes: 185 additions & 0 deletions gcloud/storage/batch.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,185 @@
# Copyright 2014 Google Inc. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Batch updates / deletes of storage buckets / blobs.

See: https://cloud.google.com/storage/docs/json_api/v1/how-tos/batch
"""
from email.encoders import encode_noop
from email.generator import Generator
from email.mime.application import MIMEApplication
from email.mime.multipart import MIMEMultipart
from email.parser import Parser
import io
import json

import six

from gcloud._localstack import _LocalStack
from gcloud.storage.connection import Connection


_BATCHES = _LocalStack()


class MIMEApplicationHTTP(MIMEApplication):
    """MIME type for ``application/http``.

    Builds the payload of one batched sub-request: the HTTP request line,
    the headers (sorted by name), a blank line, and the body.

    :type method: string
    :param method: HTTP method of the sub-request.

    :type uri: string
    :param uri: URI of the sub-request.

    :type headers: dict or None
    :param headers: HTTP headers.  The mapping is copied; the caller's
                    dict is never modified.

    :type body: dict, text, or None
    :param body: HTTP payload.  A dict is serialized as JSON and the
                 matching ``Content-Type`` / ``Content-Length`` headers
                 are added; ``None`` is sent as an empty body.
    """
    def __init__(self, method, uri, headers, body):
        # Work on a private copy: the JSON headers added below must not
        # leak into the dict owned by the caller.
        headers = dict(headers) if headers else {}
        if isinstance(body, dict):
            body = json.dumps(body)
            headers['Content-Type'] = 'application/json'
            headers['Content-Length'] = len(body)
        if body is None:
            body = ''
        lines = ['%s %s HTTP/1.1' % (method, uri)]
        lines.extend(['%s: %s' % (key, value)
                      for key, value in sorted(headers.items())])
        lines.append('')
        lines.append(body)
        payload = '\r\n'.join(lines)
        # An explicit base-class call works on Python 2 (where
        # email.message.Message is an old-style class, so 'super()' is
        # unavailable) as well as on Python 3 -- no version switch needed.
        MIMEApplication.__init__(self, payload, 'http', encode_noop)


class NoContent(object):
    """Minimal stand-in for an HTTP '204 No Content' response."""

    # HTTP status code exposed by every instance (and by the class itself).
    status = 204


class Batch(Connection):
    """Proxy an underlying connection, batching up change operations.

    ``GET`` requests are passed straight through to the proxied
    connection; every other request is queued until :meth:`finish` sends
    the whole queue as one ``multipart/mixed`` request.  Used as a context
    manager, the batch is submitted on a clean exit from the block.

    :type connection: :class:`gcloud.storage.connection.Connection`
    :param connection: the connection for which the batch proxies.
    """
    # Upper bound on the number of requests that may be queued.
    _MAX_BATCH_SIZE = 1000

    def __init__(self, connection):
        super(Batch, self).__init__(project=connection.project)
        self._connection = connection
        self._requests = []
        self._responses = []

    def _do_request(self, method, url, headers, data):
        """Override Connection: defer actual HTTP request.

        Only allow up to ``_MAX_BATCH_SIZE`` requests to be deferred.

        :type method: string
        :param method: The HTTP method to use in the request.

        :type url: string
        :param url: The URL to send the request to.

        :type headers: dict
        :param headers: A dictionary of HTTP headers to send with the request.

        :type data: string
        :param data: The data to send as the body of the request.

        :rtype: tuple of ``response`` (a dictionary of sorts)
                and ``content`` (a string).
        :returns: For ``GET``, whatever the proxied connection's HTTP
                  object returns; otherwise a :class:`NoContent`
                  placeholder and an empty string.
        :raises: ValueError if ``_MAX_BATCH_SIZE`` requests are already
                 deferred.
        """
        # Reads are never deferred: hand them to the real HTTP object.
        if method == 'GET':
            return self._connection.http.request(
                method=method, uri=url, headers=headers, body=data)

        if len(self._requests) >= self._MAX_BATCH_SIZE:
            raise ValueError("Too many deferred requests (max %d)" %
                             self._MAX_BATCH_SIZE)

        deferred = (method, url, headers, data)
        self._requests.append(deferred)
        return NoContent(), ''

    def finish(self):
        """Submit a single `multipart/mixed` request w/ deferred requests.

        :rtype: list of tuples
        :returns: one ``(status, reason, payload)`` tuple per deferred request.
        :raises: ValueError if no requests have been deferred.
        """
        if not self._requests:
            raise ValueError("No deferred requests")

        multi = MIMEMultipart()
        for method, uri, sub_headers, sub_body in self._requests:
            multi.attach(MIMEApplicationHTTP(method, uri, sub_headers,
                                             sub_body))

        # The `email` package expects to deal with "native" strings
        buf = io.StringIO() if six.PY3 else io.BytesIO()
        Generator(buf, False, 0).flatten(multi)
        flattened = buf.getvalue()

        # Strip off redundant header text: the flattened message repeats
        # the multipart headers, which are sent as HTTP headers instead.
        body = flattened.split('\n\n', 1)[1]
        headers = dict(multi._headers)

        url = '%s/batch' % self.API_BASE_URL

        response, content = self._connection._make_request(
            'POST', url, data=body, headers=headers)
        self._responses = list(_unpack_batch_response(response, content))
        return self._responses

    def __enter__(self):
        # Register this batch on the module-level stack of batches.
        _BATCHES.push(self)
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        # Submit only when the block exited cleanly; always unregister.
        try:
            if exc_type is None:
                self.finish()
        finally:
            _BATCHES.pop()


def _unpack_batch_response(response, content):
    """Convert response, content -> [(status, reason, payload)].

    :type response: dict-like
    :param response: HTTP response headers; ``response['content-type']``
                     is used to parse ``content`` as a MIME message.

    :type content: bytes or text
    :param content: body of the batch response.  Bytes (as received on
                    Python 3) are decoded as UTF-8 before parsing.

    :rtype: generator of tuples
    :returns: one ``(status, reason, payload)`` tuple per sub-response.
              ``status`` and ``reason`` are strings taken from the
              sub-response status line; ``payload`` is the decoded JSON
              object when the sub-response is ``application/json``,
              otherwise the raw payload text.
    :raises: ValueError if the response is not multi-part.  Because this
             is a generator, the error surfaces on first iteration.
    """
    # On Python 3 a bytes body would be interpolated below as "b'...'",
    # which never parses as multipart.  (On Python 2 ``bytes is str``, so
    # this branch is skipped.)
    if isinstance(content, bytes) and not isinstance(content, str):
        content = content.decode('utf-8')

    parser = Parser()
    # Prepend just enough headers for the email parser to recognize the
    # body as a MIME multipart message.
    faux_message = ('Content-Type: %s\nMIME-Version: 1.0\n\n%s' %
                    (response['content-type'], content))
    message = parser.parsestr(faux_message)

    if not message.is_multipart():
        raise ValueError('Bad response: not multi-part')

    for subrequest in message.get_payload():
        # Each part wraps a complete HTTP response: status line first,
        # then headers and body, which parse as a message of their own.
        status_line, rest = subrequest.get_payload().split('\n', 1)
        # The parser keeps CRLF line endings; drop the stray '\r' so it
        # does not end up in the reason phrase.
        _, status, reason = status_line.rstrip('\r').split(' ', 2)
        sub_message = parser.parsestr(rest)
        payload = sub_message.get_payload()
        ctype = sub_message['Content-Type']
        if ctype and ctype.startswith('application/json'):
            payload = json.loads(payload)
        yield status, reason, payload
27 changes: 26 additions & 1 deletion gcloud/storage/connection.py
Original file line number Diff line number Diff line change
Expand Up @@ -149,7 +149,8 @@ def _make_request(self, method, url, data=None, content_type=None,

:rtype: tuple of ``response`` (a dictionary of sorts)
and ``content`` (a string).
:returns: The HTTP response object and the content of the response.
:returns: The HTTP response object and the content of the response,
returned by :meth:`_do_request`.
"""
headers = headers or {}
headers['Accept-Encoding'] = 'gzip'
Expand All @@ -166,6 +167,30 @@ def _make_request(self, method, url, data=None, content_type=None,

headers['User-Agent'] = self.USER_AGENT

return self._do_request(method, url, headers, data)

def _do_request(self, method, url, headers, data):
    """Low-level helper: perform the actual API request over HTTP.

    Kept as a separate hook so that
    :class:`gcloud.storage.batch.Batch` can override it and defer the
    request instead of sending it.

    :type method: string
    :param method: The HTTP method to use in the request.

    :type url: string
    :param url: The URL to send the request to.

    :type headers: dict
    :param headers: A dictionary of HTTP headers to send with the request.

    :type data: string
    :param data: The data to send as the body of the request.

    :rtype: tuple of ``response`` (a dictionary of sorts)
            and ``content`` (a string).
    :returns: The HTTP response object and the content of the response.
    """
    send = self.http.request
    return send(uri=url, method=method, headers=headers, body=data)

Expand Down
Loading