# Copyright 2014 Google Inc. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Classes to encapsulate a single HTTP request.

The classes implement a command pattern, with every
object supporting an execute() method that does the
actual HTTP request.
"""
from __future__ import absolute_import

__author__ = "jcgregorio@google.com (Joe Gregorio)"

import base64
import copy
import errno
import gzip
import json
import logging
import mimetypes
import os
import random
import socket
import sys
import time
import uuid

from email.generator import Generator
from email.mime.multipart import MIMEMultipart
from email.mime.nonmultipart import MIMENonMultipart
from email.parser import FeedParser

# TODO(issue 221): Remove this conditional import jibbajabba.
try:
    import ssl
except ImportError:
    _ssl_SSLError = object()
else:
    _ssl_SSLError = ssl.SSLError

import httplib2
import six
from six import BytesIO, StringIO
from six.moves import http_client
from six.moves import range
from six.moves.urllib.parse import urlparse, urlunparse, quote, unquote

from googleapiclient import _auth
from googleapiclient import _helpers as util
from googleapiclient.errors import BatchError
from googleapiclient.errors import HttpError
from googleapiclient.errors import InvalidChunkSizeError
from googleapiclient.errors import ResumableUploadError
from googleapiclient.errors import UnexpectedBodyError
from googleapiclient.errors import UnexpectedMethodError
from googleapiclient.model import JsonModel


# Module-level logger used for retry and diagnostic messages.
LOGGER = logging.getLogger(__name__)

# Default chunk size, in bytes (100 MiB), for the media upload/download
# classes in this module.
DEFAULT_CHUNK_SIZE = 100 * 1024 * 1024

# NOTE(review): presumably the longest request URI sent as-is; the consumer
# of this constant is not in this part of the file -- confirm.
MAX_URI_LENGTH = 2048

# NOTE(review): presumably the maximum number of calls in one batch request;
# the consumer of this constant is not in this part of the file -- confirm.
MAX_BATCH_LIMIT = 1000

# HTTP status "429 Too Many Requests"; treated as retriable by
# _should_retry_response().
_TOO_MANY_REQUESTS = 429

# NOTE(review): presumably the default HTTP timeout in seconds; the consumer
# of this constant is not in this part of the file -- confirm.
DEFAULT_HTTP_TIMEOUT_SEC = 60

_LEGACY_BATCH_URI = "https://www.googleapis.com/batch"

if six.PY2:
    # That's a builtin python3 exception, nonexistent in python2.
    # Defined to None to avoid NameError while trying to catch it
    ConnectionError = None


90def _should_retry_response(resp_status, content):
Bu Sun Kim66bb32c2019-10-30 10:11:58 -070091 """Determines whether a response should be retried.
eesheeshc6425a02016-02-12 15:07:06 +000092
93 Args:
94 resp_status: The response status received.
Nilayan Bhattacharya90ffb852017-12-05 15:30:32 -080095 content: The response content body.
eesheeshc6425a02016-02-12 15:07:06 +000096
97 Returns:
98 True if the response should be retried, otherwise False.
99 """
Bu Sun Kim66bb32c2019-10-30 10:11:58 -0700100 # Retry on 5xx errors.
101 if resp_status >= 500:
102 return True
eesheeshc6425a02016-02-12 15:07:06 +0000103
Bu Sun Kim66bb32c2019-10-30 10:11:58 -0700104 # Retry on 429 errors.
105 if resp_status == _TOO_MANY_REQUESTS:
106 return True
eesheeshc6425a02016-02-12 15:07:06 +0000107
Bu Sun Kim66bb32c2019-10-30 10:11:58 -0700108 # For 403 errors, we have to check for the `reason` in the response to
109 # determine if we should retry.
110 if resp_status == six.moves.http_client.FORBIDDEN:
111 # If there's no details about the 403 type, don't retry.
112 if not content:
113 return False
eesheeshc6425a02016-02-12 15:07:06 +0000114
Bu Sun Kim66bb32c2019-10-30 10:11:58 -0700115 # Content is in JSON format.
116 try:
117 data = json.loads(content.decode("utf-8"))
118 if isinstance(data, dict):
119 reason = data["error"]["errors"][0]["reason"]
120 else:
121 reason = data[0]["error"]["errors"]["reason"]
122 except (UnicodeDecodeError, ValueError, KeyError):
123 LOGGER.warning("Invalid JSON content from response: %s", content)
124 return False
eesheeshc6425a02016-02-12 15:07:06 +0000125
Bu Sun Kim66bb32c2019-10-30 10:11:58 -0700126 LOGGER.warning('Encountered 403 Forbidden with reason "%s"', reason)
eesheeshc6425a02016-02-12 15:07:06 +0000127
Bu Sun Kim66bb32c2019-10-30 10:11:58 -0700128 # Only retry on rate limit related failures.
129 if reason in ("userRateLimitExceeded", "rateLimitExceeded"):
130 return True
eesheeshc6425a02016-02-12 15:07:06 +0000131
Bu Sun Kim66bb32c2019-10-30 10:11:58 -0700132 # Everything else is a success or non-retriable so break.
133 return False
eesheeshc6425a02016-02-12 15:07:06 +0000134
John Asmuth864311d2014-04-24 15:46:08 -0400135
def _retry_request(
    http, num_retries, req_type, sleep, rand, uri, method, *args, **kwargs
):
    """Retries an HTTP request multiple times while handling errors.

    If after all retries the request still fails, the last error is either
    returned as the return value (for retriable HTTP statuses such as 5xx) or
    raised (for the transport errors handled below: SSL errors, socket
    timeouts, connection errors, selected socket errors and
    httplib2.ServerNotFoundError).

    Args:
      http: Http object to be used to execute request.
      num_retries: Maximum number of retries.
      req_type: Type of the request (used for logging retries).
      sleep, rand: Functions to sleep for random time between retries.
      uri: URI to be requested.
      method: HTTP method to be used.
      args, kwargs: Additional arguments passed to http.request.

    Returns:
      resp, content - Response from the http request (may be HTTP 5xx).

    Raises:
      The last transport exception if every attempt failed with one, or
      immediately any socket.error whose errno is not in the retriable set.
    """
    resp = None
    content = None
    exception = None
    for retry_num in range(num_retries + 1):
        if retry_num > 0:
            # Sleep before retrying (randomized exponential backoff).
            sleep_time = rand() * 2 ** retry_num
            LOGGER.warning(
                "Sleeping %.2f seconds before retry %d of %d for %s: %s %s, after %s",
                sleep_time,
                retry_num,
                num_retries,
                req_type,
                method,
                uri,
                # Report the cause of the most recent failure: if the last
                # attempt raised, `resp` still holds an older response and
                # must not be reported.
                exception if exception is not None else resp.status,
            )
            sleep(sleep_time)

        try:
            exception = None
            resp, content = http.request(uri, method, *args, **kwargs)
        # Retry on SSL errors and socket timeout errors.
        except _ssl_SSLError as ssl_error:
            exception = ssl_error
        except socket.timeout as socket_timeout:
            # It's important that this be before socket.error as it's a subclass
            # socket.timeout has no errorcode
            exception = socket_timeout
        except ConnectionError as connection_error:
            # Needs to be before socket.error as it's a subclass of
            # OSError (socket.error)
            exception = connection_error
        except socket.error as socket_error:
            # errno's contents differ by platform, so we have to match by name.
            if errno.errorcode.get(socket_error.errno) not in {
                "WSAETIMEDOUT",
                "ETIMEDOUT",
                "EPIPE",
                "ECONNABORTED",
            }:
                raise
            exception = socket_error
        except httplib2.ServerNotFoundError as server_not_found_error:
            exception = server_not_found_error

        if exception:
            if retry_num == num_retries:
                # Out of attempts: surface the transport error to the caller.
                raise exception
            else:
                continue

        if not _should_retry_response(resp.status, content):
            break

    return resp, content


class MediaUploadProgress(object):
    """Status of a resumable upload."""

    def __init__(self, resumable_progress, total_size):
        """Constructor.

        Args:
          resumable_progress: int, bytes sent so far.
          total_size: int, total bytes in complete upload, or None if the total
            upload size isn't known ahead of time.
        """
        self.resumable_progress = resumable_progress
        self.total_size = total_size

    def progress(self):
        """Fraction of the upload completed, as a float.

        The value is the ratio resumable_progress / total_size (multiply by
        100 to get a percentage).

        Returns:
          the fraction complete as a float, returning 0.0 if the total size of
          the upload is unknown (None) or zero.
        """
        if self.total_size is not None and self.total_size != 0:
            return float(self.resumable_progress) / float(self.total_size)
        else:
            return 0.0


class MediaDownloadProgress(object):
    """Status of a resumable download."""

    def __init__(self, resumable_progress, total_size):
        """Constructor.

        Args:
          resumable_progress: int, bytes received so far.
          total_size: int, total bytes in complete download, or None if it is
            not known.
        """
        self.resumable_progress = resumable_progress
        self.total_size = total_size

    def progress(self):
        """Fraction of the download completed, as a float.

        The value is the ratio resumable_progress / total_size (multiply by
        100 to get a percentage).

        Returns:
          the fraction complete as a float, returning 0.0 if the total size of
          the download is unknown (None) or zero.
        """
        if self.total_size is not None and self.total_size != 0:
            return float(self.resumable_progress) / float(self.total_size)
        else:
            return 0.0


class MediaUpload(object):
    """Describes a media object to upload.

    Base class that defines the interface of MediaUpload subclasses.

    Note that subclasses of MediaUpload may allow you to control the chunksize
    when uploading a media object. It is important to keep the size of the chunk
    as large as possible to keep the upload efficient. Other factors may influence
    the size of the chunk you use, particularly if you are working in an
    environment where individual HTTP requests may have a hardcoded time limit,
    such as under certain classes of requests under Google App Engine.

    Streams are io.Base compatible objects that support seek(). Some MediaUpload
    subclasses support using streams directly to upload data. Support for
    streaming may be indicated by a MediaUpload sub-class and if appropriate for a
    platform that stream will be used for uploading the media object. The support
    for streaming is indicated by has_stream() returning True. The stream() method
    should return an io.Base object that supports seek(). On platforms where the
    underlying httplib module supports streaming, for example Python 2.6 and
    later, the stream will be passed into the http library which will result in
    less memory being used and possibly faster uploads.

    If you need to upload media that can't be uploaded using any of the existing
    MediaUpload sub-classes then you can sub-class MediaUpload for your particular
    needs.
    """

    def chunksize(self):
        """Chunk size for resumable uploads.

        Returns:
          Chunk size in bytes.
        """
        raise NotImplementedError()

    def mimetype(self):
        """Mime type of the body.

        Returns:
          Mime type.
        """
        return "application/octet-stream"

    def size(self):
        """Size of upload.

        Returns:
          Size of the body, or None if the size is unknown.
        """
        return None

    def resumable(self):
        """Whether this upload is resumable.

        Returns:
          True if resumable upload or False.
        """
        return False

    def getbytes(self, begin, end):
        """Get bytes from the media.

        Args:
          begin: int, offset from beginning of file.
          end: int, number of bytes to read, starting at begin. The parameter
            is named `end` here for backward compatibility, but
            MediaIoBaseUpload.getbytes() names it `length` and treats it as a
            byte count, not an end offset.

        Returns:
          A string of bytes read. May be shorter than the requested length if
          EOF was reached first.
        """
        raise NotImplementedError()

    def has_stream(self):
        """Does the underlying upload support a streaming interface.

        Streaming means it is an io.IOBase subclass that supports seek, i.e.
        seekable() returns True.

        Returns:
          True if the call to stream() will return an instance of a seekable io.Base
          subclass.
        """
        return False

    def stream(self):
        """A stream interface to the data being uploaded.

        Returns:
          The returned value is an io.IOBase subclass that supports seek, i.e.
          seekable() returns True.
        """
        raise NotImplementedError()

    @util.positional(1)
    def _to_json(self, strip=None):
        """Utility function for creating a JSON representation of a MediaUpload.

        Args:
          strip: array, An array of names of members to not include in the JSON.
            Every name must be an existing instance attribute (KeyError
            otherwise).

        Returns:
          string, a JSON representation of this instance, suitable to pass to
          from_json().
        """
        t = type(self)
        # Shallow copy so stripping members does not mutate the instance.
        d = copy.copy(self.__dict__)
        if strip is not None:
            for member in strip:
                del d[member]
        # Record the concrete class so new_from_json() can locate it again.
        d["_class"] = t.__name__
        d["_module"] = t.__module__
        return json.dumps(d)

    def to_json(self):
        """Create a JSON representation of an instance of MediaUpload.

        Returns:
          string, a JSON representation of this instance, suitable to pass to
          from_json().
        """
        return self._to_json()

    @classmethod
    def new_from_json(cls, s):
        """Utility class method to instantiate a MediaUpload subclass from a JSON
        representation produced by to_json().

        Args:
          s: string, JSON from to_json().

        Returns:
          An instance of the subclass of MediaUpload that was serialized with
          to_json().
        """
        data = json.loads(s)
        # Find and call the right classmethod from_json() to restore the object.
        # SECURITY NOTE: the module and class names come straight from the
        # JSON, so this imports whatever module the payload names. Only pass
        # JSON produced by to_json() from a trusted source.
        module = data["_module"]
        m = __import__(module, fromlist=module.split(".")[:-1])
        kls = getattr(m, data["_class"])
        from_json = getattr(kls, "from_json")
        return from_json(s)


class MediaIoBaseUpload(MediaUpload):
    """A MediaUpload for io.Base objects.

    Note that the Python file object is compatible with io.Base and can be used
    with this class also.

      fh = BytesIO(b'...Some data to upload...')
      media = MediaIoBaseUpload(fh, mimetype='image/png',
        chunksize=1024*1024, resumable=True)
      farm.animals().insert(
          id='cow',
          name='cow.png',
          media_body=media).execute()

    Depending on the platform you are working on, you may pass -1 as the
    chunksize, which indicates that the entire file should be uploaded in a single
    request. If the underlying platform supports streams, such as Python 2.6 or
    later, then this can be very efficient as it avoids multiple connections, and
    also avoids loading the entire file into memory before sending it. Note that
    Google App Engine has a 5MB limit on request size, so you should never set
    your chunksize larger than 5MB, or to -1.
    """

    @util.positional(3)
    def __init__(self, fd, mimetype, chunksize=DEFAULT_CHUNK_SIZE, resumable=False):
        """Constructor.

        Args:
          fd: io.Base or file object, The source of the bytes to upload. MUST be
            opened in blocking mode, do not use streams opened in non-blocking mode.
            The given stream must be seekable, that is, it must be able to call
            seek() on fd.
          mimetype: string, Mime-type of the file.
          chunksize: int, File will be uploaded in chunks of this many bytes. Only
            used if resumable=True. Pass in a value of -1 if the file is to be
            uploaded as a single chunk. Note that Google App Engine has a 5MB limit
            on request size, so you should never set your chunksize larger than 5MB,
            or to -1.
          resumable: bool, True if this is a resumable upload. False means upload
            in a single request.

        Raises:
          InvalidChunkSizeError: if chunksize is neither -1 nor positive.
        """
        super(MediaIoBaseUpload, self).__init__()
        self._fd = fd
        self._mimetype = mimetype
        if not (chunksize == -1 or chunksize > 0):
            raise InvalidChunkSizeError()
        self._chunksize = chunksize
        self._resumable = resumable

        # Determine the total size by seeking to the end of the stream.
        self._fd.seek(0, os.SEEK_END)
        self._size = self._fd.tell()

    def chunksize(self):
        """Chunk size for resumable uploads.

        Returns:
          Chunk size in bytes.
        """
        return self._chunksize

    def mimetype(self):
        """Mime type of the body.

        Returns:
          Mime type.
        """
        return self._mimetype

    def size(self):
        """Size of upload.

        Returns:
          Size of the body, as measured when the object was constructed.
        """
        return self._size

    def resumable(self):
        """Whether this upload is resumable.

        Returns:
          True if resumable upload or False.
        """
        return self._resumable

    def getbytes(self, begin, length):
        """Get bytes from the media.

        Args:
          begin: int, offset from beginning of file.
          length: int, number of bytes to read, starting at begin.

        Returns:
          A string of bytes read. May be shorter than length if EOF was reached
          first.
        """
        self._fd.seek(begin)
        return self._fd.read(length)

    def has_stream(self):
        """Does the underlying upload support a streaming interface.

        Streaming means it is an io.IOBase subclass that supports seek, i.e.
        seekable() returns True.

        Returns:
          True if the call to stream() will return an instance of a seekable io.Base
          subclass.
        """
        return True

    def stream(self):
        """A stream interface to the data being uploaded.

        Returns:
          The returned value is an io.IOBase subclass that supports seek, i.e.
          seekable() returns True.
        """
        return self._fd

    def to_json(self):
        """This upload type is not serializable."""
        raise NotImplementedError("MediaIoBaseUpload is not serializable.")


class MediaFileUpload(MediaIoBaseUpload):
    """A MediaUpload for a file.

    Construct a MediaFileUpload and pass as the media_body parameter of the
    method. For example, if we had a service that allowed uploading images:

      media = MediaFileUpload('cow.png', mimetype='image/png',
        chunksize=1024*1024, resumable=True)
      farm.animals().insert(
          id='cow',
          name='cow.png',
          media_body=media).execute()

    Depending on the platform you are working on, you may pass -1 as the
    chunksize, which indicates that the entire file should be uploaded in a single
    request. If the underlying platform supports streams, such as Python 2.6 or
    later, then this can be very efficient as it avoids multiple connections, and
    also avoids loading the entire file into memory before sending it. Note that
    Google App Engine has a 5MB limit on request size, so you should never set
    your chunksize larger than 5MB, or to -1.
    """

    @util.positional(2)
    def __init__(
        self, filename, mimetype=None, chunksize=DEFAULT_CHUNK_SIZE, resumable=False
    ):
        """Constructor.

        Args:
          filename: string, Name of the file.
          mimetype: string, Mime-type of the file. If None then a mime-type will be
            guessed from the file extension.
          chunksize: int, File will be uploaded in chunks of this many bytes. Only
            used if resumable=True. Pass in a value of -1 if the file is to be
            uploaded in a single chunk. Note that Google App Engine has a 5MB limit
            on request size, so you should never set your chunksize larger than 5MB,
            or to -1.
          resumable: bool, True if this is a resumable upload. False means upload
            in a single request.

        Raises:
          IOError/OSError: if the file cannot be opened.
          InvalidChunkSizeError: if chunksize is neither -1 nor positive.
        """
        # Define _fd up front so __del__ is safe even if open() raises below.
        self._fd = None
        self._filename = filename
        fd = open(self._filename, "rb")
        if mimetype is None:
            # No mimetype provided, make a guess.
            mimetype, _ = mimetypes.guess_type(filename)
            if mimetype is None:
                # Guess failed, use octet-stream.
                mimetype = "application/octet-stream"
        try:
            super(MediaFileUpload, self).__init__(
                fd, mimetype, chunksize=chunksize, resumable=resumable
            )
        except Exception:
            # Do not leak the file handle when base-class validation fails.
            fd.close()
            self._fd = None
            raise

    def __del__(self):
        # _fd is missing/None when construction failed before the file was
        # opened; guard so finalization never raises AttributeError.
        fd = getattr(self, "_fd", None)
        if fd is not None:
            fd.close()

    def to_json(self):
        """Creating a JSON representation of an instance of MediaFileUpload.

        The open file object is not serializable, so it is stripped; from_json()
        re-opens the file by name.

        Returns:
           string, a JSON representation of this instance, suitable to pass to
           from_json().
        """
        return self._to_json(strip=["_fd"])

    @staticmethod
    def from_json(s):
        """Rebuild a MediaFileUpload from JSON produced by to_json().

        Args:
          s: string, JSON from to_json().

        Returns:
          A new MediaFileUpload for the serialized filename, mimetype,
          chunksize and resumable flag.
        """
        d = json.loads(s)
        return MediaFileUpload(
            d["_filename"],
            mimetype=d["_mimetype"],
            chunksize=d["_chunksize"],
            resumable=d["_resumable"],
        )


class MediaInMemoryUpload(MediaIoBaseUpload):
    """MediaUpload for a chunk of bytes.

    DEPRECATED: Use MediaIoBaseUpload with either io.TextIOBase or StringIO for
    the stream.
    """

    @util.positional(2)
    def __init__(
        self,
        body,
        mimetype="application/octet-stream",
        chunksize=DEFAULT_CHUNK_SIZE,
        resumable=False,
    ):
        """Create a new MediaInMemoryUpload.

        DEPRECATED: Use MediaIoBaseUpload with either io.TextIOBase or StringIO for
        the stream.

        Args:
          body: string, Bytes of body content. It is wrapped in a BytesIO, so it
            must be a bytes-like value.
          mimetype: string, Mime-type of the file or default of
            'application/octet-stream'.
          chunksize: int, File will be uploaded in chunks of this many bytes. Only
            used if resumable=True.
          resumable: bool, True if this is a resumable upload. False means upload
            in a single request.
        """
        fd = BytesIO(body)
        super(MediaInMemoryUpload, self).__init__(
            fd, mimetype, chunksize=chunksize, resumable=resumable
        )


class MediaIoBaseDownload(object):
    """Download media resources.

    Note that the Python file object is compatible with io.Base and can be used
    with this class also.


    Example:
      request = farms.animals().get_media(id='cow')
      fh = io.FileIO('cow.png', mode='wb')
      downloader = MediaIoBaseDownload(fh, request, chunksize=1024*1024)

      done = False
      while done is False:
        status, done = downloader.next_chunk()
        if status:
          print("Download %d%%." % int(status.progress() * 100))
      print("Download Complete!")
    """

    @util.positional(3)
    def __init__(self, fd, request, chunksize=DEFAULT_CHUNK_SIZE):
        """Constructor.

        Args:
          fd: io.Base or file object, The stream in which to write the downloaded
            bytes.
          request: googleapiclient.http.HttpRequest, the media request to perform in
            chunks.
          chunksize: int, File will be downloaded in chunks of this many bytes.
        """
        self._fd = fd
        self._request = request
        self._uri = request.uri
        self._chunksize = chunksize
        self._progress = 0
        self._total_size = None
        self._done = False

        # Stubs for testing.
        self._sleep = time.sleep
        self._rand = random.random

        self._headers = {}
        for k, v in six.iteritems(request.headers):
            # allow users to supply custom headers by setting them on the request
            # but strip out the ones that are set by default on requests generated by
            # API methods like Drive's files().get(fileId=...)
            if k.lower() not in ("accept", "accept-encoding", "user-agent"):
                self._headers[k] = v

    @util.positional(1)
    def next_chunk(self, num_retries=0):
        """Get the next chunk of the download.

        Args:
          num_retries: Integer, number of times to retry with randomized
                exponential backoff. If all retries fail, the raised HttpError
                represents the last request. If zero (default), we attempt the
                request only once.

        Returns:
          (status, done): (MediaDownloadProgress, boolean)
             The value of 'done' will be True when the media has been fully
             downloaded or the total size of the media is unknown.

        Raises:
          googleapiclient.errors.HttpError if the response was not a 2xx.
          httplib2.HttpLib2Error if a transport error has occurred.
        """
        headers = self._headers.copy()
        # HTTP byte ranges are inclusive on both ends, so the last byte of a
        # chunk of `chunksize` bytes is at offset progress + chunksize - 1.
        headers["range"] = "bytes=%d-%d" % (
            self._progress,
            self._progress + self._chunksize - 1,
        )
        http = self._request.http

        resp, content = _retry_request(
            http,
            num_retries,
            "media download",
            self._sleep,
            self._rand,
            self._uri,
            "GET",
            headers=headers,
        )

        if resp.status in [200, 206]:
            # Follow the server-provided location for subsequent chunks.
            if "content-location" in resp and resp["content-location"] != self._uri:
                self._uri = resp["content-location"]
            self._progress += len(content)
            self._fd.write(content)

            if "content-range" in resp:
                # Content-Range looks like "bytes 0-9/100"; the part after the
                # slash is the total size.
                content_range = resp["content-range"]
                length = content_range.rsplit("/", 1)[1]
                self._total_size = int(length)
            elif "content-length" in resp:
                self._total_size = int(resp["content-length"])

            if self._total_size is None or self._progress == self._total_size:
                self._done = True
            return MediaDownloadProgress(self._progress, self._total_size), self._done

        if resp.status == 416 and "content-range" in resp:
            # 416 Range Not Satisfiable with a total length of 0 means the
            # object is empty: there is nothing to fetch, so the download is
            # complete rather than failed.
            length = resp["content-range"].rsplit("/", 1)[-1]
            if length == "0":
                self._total_size = 0
                self._done = True
                return (
                    MediaDownloadProgress(self._progress, self._total_size),
                    self._done,
                )

        raise HttpError(resp, content, uri=self._uri)


class _StreamSlice(object):
    """Truncated stream.

    Takes a stream and presents a stream that is a slice of the original stream.
    This is used when uploading media in chunks. In later versions of Python a
    stream can be passed to httplib in place of the string of data to send. The
    problem is that httplib just blindly reads to the end of the stream. This
    wrapper presents a virtual stream that only reads to the end of the chunk.
    """

    def __init__(self, stream, begin, chunksize):
        """Constructor.

        Args:
          stream: (io.Base, file object), the stream to wrap.
          begin: int, the seek position the chunk begins at.
          chunksize: int, the size of the chunk.
        """
        self._stream = stream
        self._begin = begin
        self._chunksize = chunksize
        self._stream.seek(begin)

    def read(self, n=-1):
        """Read n bytes.

        Args:
          n, int, the number of bytes to read. None or any negative value
            means "everything that is left in the slice".

        Returns:
          A string of length 'n', or less if the end of the slice (or EOF of
          the underlying stream) is reached.
        """
        # The data left available to read sits in [cur, end). Clamp at zero so
        # a cursor that was moved past the slice never turns into a negative
        # size, which the underlying stream would treat as "read to EOF".
        cur = self._stream.tell()
        end = self._begin + self._chunksize
        remaining = max(end - cur, 0)
        if n is None or n < 0 or n > remaining:
            n = remaining
        return self._stream.read(n)
John Asmuth864311d2014-04-24 15:46:08 -0400790
791
class HttpRequest(object):
    """Encapsulates a single HTTP request."""

    @util.positional(4)
    def __init__(
        self,
        http,
        postproc,
        uri,
        method="GET",
        body=None,
        headers=None,
        methodId=None,
        resumable=None,
    ):
        """Constructor for an HttpRequest.

        Args:
          http: httplib2.Http, the transport object to use to make a request
          postproc: callable, called on the HTTP response and content to transform
                    it into a data object before returning, or raising an exception
                    on an error.
          uri: string, the absolute URI to send the request to
          method: string, the HTTP method to use
          body: string, the request body of the HTTP request,
          headers: dict, the HTTP request headers
          methodId: string, a unique identifier for the API method being called.
          resumable: MediaUpload, None if this is not a resumable request.
        """
        self.uri = uri
        self.method = method
        self.body = body
        self.headers = headers or {}
        self.methodId = methodId
        self.http = http
        self.postproc = postproc
        self.resumable = resumable
        self.response_callbacks = []
        self._in_error_state = False

        # The size of the non-media part of the request.
        self.body_size = len(self.body or "")

        # The resumable URI to send chunks to.
        self.resumable_uri = None

        # The bytes that have been uploaded.
        self.resumable_progress = 0

        # Stubs for testing.
        self._rand = random.random
        self._sleep = time.sleep

    @util.positional(1)
    def execute(self, http=None, num_retries=0):
        """Execute the request.

        Args:
          http: httplib2.Http, an http object to be used in place of the
                one the HttpRequest request object was constructed with.
          num_retries: Integer, number of times to retry with randomized
                exponential backoff. If all retries fail, the raised HttpError
                represents the last request. If zero (default), we attempt the
                request only once.

        Returns:
          A deserialized object model of the response body as determined
          by the postproc.

        Raises:
          googleapiclient.errors.HttpError if the response was not a 2xx.
          httplib2.HttpLib2Error if a transport error has occurred.
        """
        if http is None:
            http = self.http

        if self.resumable:
            # Drive the resumable upload to completion; next_chunk() yields a
            # body of None until the final chunk has been accepted.
            body = None
            while body is None:
                _, body = self.next_chunk(http=http, num_retries=num_retries)
            return body

        # Non-resumable case.

        if "content-length" not in self.headers:
            self.headers["content-length"] = str(self.body_size)
        # If the request URI is too long then turn it into a POST request.
        # Assume that a GET request never contains a request body.
        if len(self.uri) > MAX_URI_LENGTH and self.method == "GET":
            self.method = "POST"
            self.headers["x-http-method-override"] = "GET"
            self.headers["content-type"] = "application/x-www-form-urlencoded"
            parsed = urlparse(self.uri)
            self.uri = urlunparse(
                (parsed.scheme, parsed.netloc, parsed.path, parsed.params, None, None)
            )
            self.body = parsed.query
            self.headers["content-length"] = str(len(self.body))

        # Handle retries for server-side errors.
        resp, content = _retry_request(
            http,
            num_retries,
            "request",
            self._sleep,
            self._rand,
            str(self.uri),
            method=str(self.method),
            body=self.body,
            headers=self.headers,
        )

        for callback in self.response_callbacks:
            callback(resp)
        if resp.status >= 300:
            raise HttpError(resp, content, uri=self.uri)
        return self.postproc(resp, content)

    @util.positional(2)
    def add_response_callback(self, cb):
        """add_response_headers_callback

        Args:
          cb: Callback to be called on receiving the response headers, of signature:

          def cb(resp):
            # Where resp is an instance of httplib2.Response
        """
        self.response_callbacks.append(cb)

    @util.positional(1)
    def next_chunk(self, http=None, num_retries=0):
        """Execute the next step of a resumable upload.

        Can only be used if the method being executed supports media uploads and
        the MediaUpload object passed in was flagged as using resumable upload.

        Example:

          media = MediaFileUpload('cow.png', mimetype='image/png',
                                  chunksize=1000, resumable=True)
          request = farm.animals().insert(
              id='cow',
              name='cow.png',
              media_body=media)

          response = None
          while response is None:
            status, response = request.next_chunk()
            if status:
              print("Upload %d%% complete." % int(status.progress() * 100))


        Args:
          http: httplib2.Http, an http object to be used in place of the
                one the HttpRequest request object was constructed with.
          num_retries: Integer, number of times to retry with randomized
                exponential backoff. If all retries fail, the raised HttpError
                represents the last request. If zero (default), we attempt the
                request only once.

        Returns:
          (status, body): (ResumableMediaStatus, object)
             The body will be None until the resumable media is fully uploaded.

        Raises:
          googleapiclient.errors.HttpError if the response was not a 2xx.
          httplib2.HttpLib2Error if a transport error has occurred.
        """
        if http is None:
            http = self.http

        if self.resumable.size() is None:
            size = "*"
        else:
            size = str(self.resumable.size())

        if self.resumable_uri is None:
            # First call: ask the server for the URI to send the chunks to.
            start_headers = copy.copy(self.headers)
            start_headers["X-Upload-Content-Type"] = self.resumable.mimetype()
            if size != "*":
                start_headers["X-Upload-Content-Length"] = size
            start_headers["content-length"] = str(self.body_size)

            resp, content = _retry_request(
                http,
                num_retries,
                "resumable URI request",
                self._sleep,
                self._rand,
                self.uri,
                method=self.method,
                body=self.body,
                headers=start_headers,
            )

            if resp.status == 200 and "location" in resp:
                self.resumable_uri = resp["location"]
            else:
                raise ResumableUploadError(resp, content)
        elif self._in_error_state:
            # If we are in an error state then query the server for current state of
            # the upload by sending an empty PUT and reading the 'range' header in
            # the response.
            headers = {"Content-Range": "bytes */%s" % size, "content-length": "0"}
            resp, content = http.request(self.resumable_uri, "PUT", headers=headers)
            status, body = self._process_response(resp, content)
            if body:
                # The upload was complete.
                return (status, body)

        if self.resumable.has_stream():
            data = self.resumable.stream()
            if self.resumable.chunksize() == -1:
                # Send everything from the current position to the end of the
                # stream. chunk_end is an absolute offset (the last byte of the
                # media), so it must not be reduced by the bytes already sent.
                data.seek(self.resumable_progress)
                chunk_end = self.resumable.size() - 1
            else:
                # Doing chunking with a stream, so wrap a slice of the stream.
                data = _StreamSlice(
                    data, self.resumable_progress, self.resumable.chunksize()
                )
                chunk_end = min(
                    self.resumable_progress + self.resumable.chunksize() - 1,
                    self.resumable.size() - 1,
                )
        else:
            data = self.resumable.getbytes(
                self.resumable_progress, self.resumable.chunksize()
            )

            # A short read implies that we are at EOF, so finish the upload.
            if len(data) < self.resumable.chunksize():
                size = str(self.resumable_progress + len(data))

            chunk_end = self.resumable_progress + len(data) - 1

        headers = {
            # Must set the content-length header here because httplib can't
            # calculate the size when working with _StreamSlice.
            "Content-Length": str(chunk_end - self.resumable_progress + 1),
        }

        # An empty file results in chunk_end = -1 and size = 0
        # sending "bytes 0--1/0" results in an invalid request
        # Only add header "Content-Range" if chunk_end != -1
        if chunk_end != -1:
            headers["Content-Range"] = "bytes %d-%d/%s" % (
                self.resumable_progress,
                chunk_end,
                size,
            )

        for retry_num in range(num_retries + 1):
            if retry_num > 0:
                self._sleep(self._rand() * 2 ** retry_num)
                LOGGER.warning(
                    "Retry #%d for media upload: %s %s, following status: %d",
                    retry_num,
                    self.method,
                    self.uri,
                    resp.status,
                )
                # The previous attempt consumed the stream; rewind it so the
                # retry sends the same bytes again. A _StreamSlice reads from
                # the same underlying stream, so this resets it as well.
                if self.resumable.has_stream():
                    self.resumable.stream().seek(self.resumable_progress)

            try:
                resp, content = http.request(
                    self.resumable_uri, method="PUT", body=data, headers=headers
                )
            except BaseException:
                # Whatever went wrong, the server state is now unknown; remember
                # that so the next call queries the upload status first.
                self._in_error_state = True
                raise
            if not _should_retry_response(resp.status, content):
                break

        return self._process_response(resp, content)

    def _process_response(self, resp, content):
        """Process the response from a single chunk upload.

        Args:
          resp: httplib2.Response, the response object.
          content: string, the content of the response.

        Returns:
          (status, body): (ResumableMediaStatus, object)
             The body will be None until the resumable media is fully uploaded.

        Raises:
          googleapiclient.errors.HttpError if the response was not a 2xx or a 308.
        """
        if resp.status in [200, 201]:
            self._in_error_state = False
            return None, self.postproc(resp, content)
        elif resp.status == 308:
            self._in_error_state = False
            # A "308 Resume Incomplete" indicates we are not done.
            try:
                self.resumable_progress = int(resp["range"].split("-")[1]) + 1
            except KeyError:
                # If resp doesn't contain range header, resumable progress is 0
                self.resumable_progress = 0
            if "location" in resp:
                self.resumable_uri = resp["location"]
        else:
            self._in_error_state = True
            raise HttpError(resp, content, uri=self.uri)

        return (
            MediaUploadProgress(self.resumable_progress, self.resumable.size()),
            None,
        )

    def to_json(self):
        """Returns a JSON representation of the HttpRequest."""
        d = copy.copy(self.__dict__)
        if d["resumable"] is not None:
            d["resumable"] = self.resumable.to_json()
        # Drop the members that cannot be serialized; from_json() takes http
        # and postproc as arguments and __init__ recreates the test stubs.
        del d["http"]
        del d["postproc"]
        del d["_sleep"]
        del d["_rand"]

        return json.dumps(d)

    @staticmethod
    def from_json(s, http, postproc):
        """Returns an HttpRequest populated with info from a JSON object."""
        d = json.loads(s)
        if d["resumable"] is not None:
            d["resumable"] = MediaUpload.new_from_json(d["resumable"])
        return HttpRequest(
            http,
            postproc,
            uri=d["uri"],
            method=d["method"],
            body=d["body"],
            headers=d["headers"],
            methodId=d["methodId"],
            resumable=d["resumable"],
        )

    @staticmethod
    def null_postproc(resp, contents):
        """Postproc that returns the response and contents unchanged."""
        return resp, contents
1128
John Asmuth864311d2014-04-24 15:46:08 -04001129
1130class BatchHttpRequest(object):
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001131 """Batches multiple HttpRequest objects into a single HTTP request.
John Asmuth864311d2014-04-24 15:46:08 -04001132
1133 Example:
1134 from googleapiclient.http import BatchHttpRequest
1135
1136 def list_animals(request_id, response, exception):
1137 \"\"\"Do something with the animals list response.\"\"\"
1138 if exception is not None:
1139 # Do something with the exception.
1140 pass
1141 else:
1142 # Do something with the response.
1143 pass
1144
1145 def list_farmers(request_id, response, exception):
1146 \"\"\"Do something with the farmers list response.\"\"\"
1147 if exception is not None:
1148 # Do something with the exception.
1149 pass
1150 else:
1151 # Do something with the response.
1152 pass
1153
1154 service = build('farm', 'v2')
1155
1156 batch = BatchHttpRequest()
1157
1158 batch.add(service.animals().list(), list_animals)
1159 batch.add(service.farmers().list(), list_farmers)
1160 batch.execute(http=http)
1161 """
1162
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001163 @util.positional(1)
1164 def __init__(self, callback=None, batch_uri=None):
1165 """Constructor for a BatchHttpRequest.
John Asmuth864311d2014-04-24 15:46:08 -04001166
1167 Args:
1168 callback: callable, A callback to be called for each response, of the
1169 form callback(id, response, exception). The first parameter is the
1170 request id, and the second is the deserialized response object. The
1171 third is an googleapiclient.errors.HttpError exception object if an HTTP error
1172 occurred while processing the request, or None if no error occurred.
1173 batch_uri: string, URI to send batch requests to.
1174 """
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001175 if batch_uri is None:
1176 batch_uri = _LEGACY_BATCH_URI
Jon Wayne Parrottbae748a2018-03-28 10:21:12 -07001177
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001178 if batch_uri == _LEGACY_BATCH_URI:
Dmitry Frenkelf3348f92020-07-15 13:05:58 -07001179 LOGGER.warning(
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001180 "You have constructed a BatchHttpRequest using the legacy batch "
Brad Vogel6ddadd72020-05-15 10:02:04 -07001181 "endpoint %s. This endpoint will be turned down on August 12, 2020. "
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001182 "Please provide the API-specific endpoint or use "
1183 "service.new_batch_http_request(). For more details see "
1184 "https://developers.googleblog.com/2018/03/discontinuing-support-for-json-rpc-and.html"
1185 "and https://developers.google.com/api-client-library/python/guide/batch.",
1186 _LEGACY_BATCH_URI,
1187 )
1188 self._batch_uri = batch_uri
John Asmuth864311d2014-04-24 15:46:08 -04001189
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001190 # Global callback to be called for each individual response in the batch.
1191 self._callback = callback
John Asmuth864311d2014-04-24 15:46:08 -04001192
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001193 # A map from id to request.
1194 self._requests = {}
John Asmuth864311d2014-04-24 15:46:08 -04001195
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001196 # A map from id to callback.
1197 self._callbacks = {}
John Asmuth864311d2014-04-24 15:46:08 -04001198
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001199 # List of request ids, in the order in which they were added.
1200 self._order = []
John Asmuth864311d2014-04-24 15:46:08 -04001201
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001202 # The last auto generated id.
1203 self._last_auto_id = 0
John Asmuth864311d2014-04-24 15:46:08 -04001204
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001205 # Unique ID on which to base the Content-ID headers.
1206 self._base_id = None
John Asmuth864311d2014-04-24 15:46:08 -04001207
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001208 # A map from request id to (httplib2.Response, content) response pairs
1209 self._responses = {}
John Asmuth864311d2014-04-24 15:46:08 -04001210
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001211 # A map of id(Credentials) that have been refreshed.
1212 self._refreshed_credentials = {}
John Asmuth864311d2014-04-24 15:46:08 -04001213
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001214 def _refresh_and_apply_credentials(self, request, http):
1215 """Refresh the credentials and apply to the request.
John Asmuth864311d2014-04-24 15:46:08 -04001216
1217 Args:
1218 request: HttpRequest, the request.
1219 http: httplib2.Http, the global http object for the batch.
1220 """
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001221 # For the credentials to refresh, but only once per refresh_token
1222 # If there is no http per the request then refresh the http passed in
1223 # via execute()
1224 creds = None
1225 request_credentials = False
Jon Wayne Parrottd3a5cf42017-06-19 17:55:04 -07001226
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001227 if request.http is not None:
1228 creds = _auth.get_credentials_from_http(request.http)
1229 request_credentials = True
Jon Wayne Parrottd3a5cf42017-06-19 17:55:04 -07001230
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001231 if creds is None and http is not None:
1232 creds = _auth.get_credentials_from_http(http)
Jon Wayne Parrottd3a5cf42017-06-19 17:55:04 -07001233
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001234 if creds is not None:
1235 if id(creds) not in self._refreshed_credentials:
1236 _auth.refresh_credentials(creds)
1237 self._refreshed_credentials[id(creds)] = 1
John Asmuth864311d2014-04-24 15:46:08 -04001238
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001239 # Only apply the credentials if we are using the http object passed in,
1240 # otherwise apply() will get called during _serialize_request().
1241 if request.http is None or not request_credentials:
1242 _auth.apply_credentials(creds, request.headers)
Jon Wayne Parrottd3a5cf42017-06-19 17:55:04 -07001243
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001244 def _id_to_header(self, id_):
1245 """Convert an id to a Content-ID header value.
John Asmuth864311d2014-04-24 15:46:08 -04001246
1247 Args:
1248 id_: string, identifier of individual request.
1249
1250 Returns:
1251 A Content-ID header with the id_ encoded into it. A UUID is prepended to
1252 the value because Content-ID headers are supposed to be universally
1253 unique.
1254 """
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001255 if self._base_id is None:
1256 self._base_id = uuid.uuid4()
John Asmuth864311d2014-04-24 15:46:08 -04001257
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001258 # NB: we intentionally leave whitespace between base/id and '+', so RFC2822
1259 # line folding works properly on Python 3; see
Marie J.I48f503f2020-05-15 13:32:11 -04001260 # https://github.com/googleapis/google-api-python-client/issues/164
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001261 return "<%s + %s>" % (self._base_id, quote(id_))
John Asmuth864311d2014-04-24 15:46:08 -04001262
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001263 def _header_to_id(self, header):
1264 """Convert a Content-ID header value to an id.
John Asmuth864311d2014-04-24 15:46:08 -04001265
1266 Presumes the Content-ID header conforms to the format that _id_to_header()
1267 returns.
1268
1269 Args:
1270 header: string, Content-ID header value.
1271
1272 Returns:
1273 The extracted id value.
1274
1275 Raises:
1276 BatchError if the header is not in the expected format.
1277 """
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001278 if header[0] != "<" or header[-1] != ">":
1279 raise BatchError("Invalid value for Content-ID: %s" % header)
1280 if "+" not in header:
1281 raise BatchError("Invalid value for Content-ID: %s" % header)
1282 base, id_ = header[1:-1].split(" + ", 1)
John Asmuth864311d2014-04-24 15:46:08 -04001283
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001284 return unquote(id_)
John Asmuth864311d2014-04-24 15:46:08 -04001285
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001286 def _serialize_request(self, request):
1287 """Convert an HttpRequest object into a string.
John Asmuth864311d2014-04-24 15:46:08 -04001288
1289 Args:
1290 request: HttpRequest, the request to serialize.
1291
1292 Returns:
1293 The request as a string in application/http format.
1294 """
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001295 # Construct status line
1296 parsed = urlparse(request.uri)
1297 request_line = urlunparse(
1298 ("", "", parsed.path, parsed.params, parsed.query, "")
John Asmuth864311d2014-04-24 15:46:08 -04001299 )
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001300 status_line = request.method + " " + request_line + " HTTP/1.1\n"
1301 major, minor = request.headers.get("content-type", "application/json").split(
1302 "/"
1303 )
1304 msg = MIMENonMultipart(major, minor)
1305 headers = request.headers.copy()
John Asmuth864311d2014-04-24 15:46:08 -04001306
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001307 if request.http is not None:
1308 credentials = _auth.get_credentials_from_http(request.http)
1309 if credentials is not None:
1310 _auth.apply_credentials(credentials, headers)
John Asmuth864311d2014-04-24 15:46:08 -04001311
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001312 # MIMENonMultipart adds its own Content-Type header.
1313 if "content-type" in headers:
1314 del headers["content-type"]
John Asmuth864311d2014-04-24 15:46:08 -04001315
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001316 for key, value in six.iteritems(headers):
1317 msg[key] = value
1318 msg["Host"] = parsed.netloc
1319 msg.set_unixfrom(None)
John Asmuth864311d2014-04-24 15:46:08 -04001320
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001321 if request.body is not None:
1322 msg.set_payload(request.body)
1323 msg["content-length"] = str(len(request.body))
John Asmuth864311d2014-04-24 15:46:08 -04001324
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001325 # Serialize the mime message.
1326 fp = StringIO()
1327 # maxheaderlen=0 means don't line wrap headers.
1328 g = Generator(fp, maxheaderlen=0)
1329 g.flatten(msg, unixfrom=False)
1330 body = fp.getvalue()
John Asmuth864311d2014-04-24 15:46:08 -04001331
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001332 return status_line + body
John Asmuth864311d2014-04-24 15:46:08 -04001333
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001334 def _deserialize_response(self, payload):
1335 """Convert string into httplib2 response and content.
John Asmuth864311d2014-04-24 15:46:08 -04001336
1337 Args:
1338 payload: string, headers and body as a string.
1339
1340 Returns:
1341 A pair (resp, content), such as would be returned from httplib2.request.
1342 """
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001343 # Strip off the status line
1344 status_line, payload = payload.split("\n", 1)
1345 protocol, status, reason = status_line.split(" ", 2)
John Asmuth864311d2014-04-24 15:46:08 -04001346
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001347 # Parse the rest of the response
1348 parser = FeedParser()
1349 parser.feed(payload)
1350 msg = parser.close()
1351 msg["status"] = status
John Asmuth864311d2014-04-24 15:46:08 -04001352
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001353 # Create httplib2.Response from the parsed headers.
1354 resp = httplib2.Response(msg)
1355 resp.reason = reason
1356 resp.version = int(protocol.split("/", 1)[1].replace(".", ""))
John Asmuth864311d2014-04-24 15:46:08 -04001357
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001358 content = payload.split("\r\n\r\n", 1)[1]
John Asmuth864311d2014-04-24 15:46:08 -04001359
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001360 return resp, content
John Asmuth864311d2014-04-24 15:46:08 -04001361
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001362 def _new_id(self):
1363 """Create a new id.
John Asmuth864311d2014-04-24 15:46:08 -04001364
1365 Auto incrementing number that avoids conflicts with ids already used.
1366
1367 Returns:
1368 string, a new unique id.
1369 """
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001370 self._last_auto_id += 1
1371 while str(self._last_auto_id) in self._requests:
1372 self._last_auto_id += 1
1373 return str(self._last_auto_id)
John Asmuth864311d2014-04-24 15:46:08 -04001374
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001375 @util.positional(2)
1376 def add(self, request, callback=None, request_id=None):
1377 """Add a new request.
John Asmuth864311d2014-04-24 15:46:08 -04001378
1379 Every callback added will be paired with a unique id, the request_id. That
1380 unique id will be passed back to the callback when the response comes back
1381 from the server. The default behavior is to have the library generate it's
1382 own unique id. If the caller passes in a request_id then they must ensure
1383 uniqueness for each request_id, and if they are not an exception is
cspeidelfbaf9d72018-05-10 12:50:12 -06001384 raised. Callers should either supply all request_ids or never supply a
John Asmuth864311d2014-04-24 15:46:08 -04001385 request id, to avoid such an error.
1386
1387 Args:
1388 request: HttpRequest, Request to add to the batch.
1389 callback: callable, A callback to be called for this response, of the
1390 form callback(id, response, exception). The first parameter is the
1391 request id, and the second is the deserialized response object. The
1392 third is an googleapiclient.errors.HttpError exception object if an HTTP error
1393 occurred while processing the request, or None if no errors occurred.
Chris McDonough3cf5e602018-07-18 16:18:38 -04001394 request_id: string, A unique id for the request. The id will be passed
1395 to the callback with the response.
John Asmuth864311d2014-04-24 15:46:08 -04001396
1397 Returns:
1398 None
1399
1400 Raises:
1401 BatchError if a media request is added to a batch.
1402 KeyError is the request_id is not unique.
1403 """
Xinan Line2dccec2018-12-07 05:28:33 +09001404
Bu Sun Kim66bb32c2019-10-30 10:11:58 -07001405 if len(self._order) >= MAX_BATCH_LIMIT:
1406 raise BatchError(
1407 "Exceeded the maximum calls(%d) in a single batch request."
1408 % MAX_BATCH_LIMIT
1409 )
1410 if request_id is None:
1411 request_id = self._new_id()
1412 if request.resumable is not None:
1413 raise BatchError("Media requests cannot be used in a batch request.")
1414 if request_id in self._requests:
1415 raise KeyError("A request with this ID already exists: %s" % request_id)
1416 self._requests[request_id] = request
1417 self._callbacks[request_id] = callback
1418 self._order.append(request_id)
John Asmuth864311d2014-04-24 15:46:08 -04001419
def _execute(self, http, order, requests):
    """Send the given requests as a single multipart batch and store replies.

    Every request is serialized into an application/http part labelled with
    a Content-ID derived from its request id. The assembled multipart/mixed
    message is POSTed to the batch URI. Each part of the multipart reply is
    then deserialized and stored in self._responses under the request id
    recovered from that part's Content-ID header.

    Args:
      http: httplib2.Http, an http object to be used to make the request with.
      order: list, request ids in the order they should be sent.
      requests: mapping of request id to the request object to send; it is
        indexed with every id found in order.

    Raises:
      httplib2.HttpLib2Error if a transport error has occurred.
      HttpError if the batch endpoint answers with a status of 300 or above.
      googleapiclient.errors.BatchError if the response is the wrong format.
    """
    envelope = MIMEMultipart("mixed")
    # The outer message should not write out its own headers.
    envelope._write_headers = lambda self: None

    # One application/http part per request, in the requested order.
    for request_id in order:
        request = requests[request_id]

        part = MIMENonMultipart("application", "http")
        part["Content-Transfer-Encoding"] = "binary"
        part["Content-ID"] = self._id_to_header(request_id)
        part.set_payload(self._serialize_request(request))
        envelope.attach(part)

    # Flatten through a Generator instead of `as_string`, because the latter
    # plays games with `From ` lines.
    buffer = StringIO()
    Generator(buffer, mangle_from_=False).flatten(envelope, unixfrom=False)
    payload = buffer.getvalue()

    # The boundary is read after flattening the message.
    batch_headers = {
        "content-type": 'multipart/mixed; boundary="%s"' % envelope.get_boundary()
    }

    resp, content = http.request(
        self._batch_uri, method="POST", body=payload, headers=batch_headers
    )

    if resp.status >= 300:
        raise HttpError(resp, content, uri=self._batch_uri)

    # FeedParser needs a leading content-type header to parse the body.
    prefix = "content-type: %s\r\n\r\n" % resp["content-type"]
    # PY3's FeedParser only accepts unicode, so decode the body here and
    # re-encode each individual payload further down.
    if six.PY3:
        content = content.decode("utf-8")

    parser = FeedParser()
    parser.feed(prefix + content)
    mime_response = parser.close()

    if not mime_response.is_multipart():
        raise BatchError(
            "Response not in multipart/mixed format.", resp=resp, content=content
        )

    for part in mime_response.get_payload():
        request_id = self._header_to_id(part["Content-ID"])
        part_resp, part_content = self._deserialize_response(part.get_payload())
        # Encode text content so it looks like a normal http response body.
        if isinstance(part_content, six.text_type):
            part_content = part_content.encode("utf-8")
        self._responses[request_id] = (part_resp, part_content)
John Asmuth864311d2014-04-24 15:46:08 -04001492
@util.positional(1)
def execute(self, http=None):
    """Run every queued request as one batched HTTP call, then fire callbacks.

    After the first round trip, any request whose individual response status
    is "401" has its credentials refreshed and is resent in a second batch.
    Finally each request's callback, followed by the batch-wide callback, is
    invoked with (request_id, response, exception).

    Args:
      http: httplib2.Http, an http object to be used in place of the one the
        HttpRequest request object was constructed with. If one isn't supplied
        then use a http object from the requests in this batch.

    Returns:
      None

    Raises:
      ValueError if no http object was supplied and none could be taken from
        the queued requests.
      httplib2.HttpLib2Error if a transport error has occurred.
      googleapiclient.errors.BatchError if the response is the wrong format.
    """
    # Nothing queued, nothing to do.
    if not self._order:
        return None

    # Fall back to the http object of the first non-None queued request.
    if http is None:
        queued = (self._requests[request_id] for request_id in self._order)
        first_request = next((req for req in queued if req is not None), None)
        if first_request is not None:
            http = first_request.http

    if http is None:
        raise ValueError("Missing a valid http object.")

    # OAuth2Credentials-style objects may not have been refreshed with an
    # initial access_token yet; do that before sending anything.
    creds = _auth.get_credentials_from_http(http)
    if creds is not None and not _auth.is_valid(creds):
        LOGGER.info("Attempting refresh to obtain initial access_token")
        _auth.refresh_credentials(creds)

    self._execute(http, self._order, self._requests)

    # Collect every request answered with a 401, refreshing its credentials
    # as we go, so they can be retried together in a separate batch.
    retry_order = []
    retry_requests = {}
    for request_id in self._order:
        resp, _ = self._responses[request_id]
        if resp["status"] != "401":
            continue
        retry_order.append(request_id)
        rejected = self._requests[request_id]
        self._refresh_and_apply_credentials(rejected, http)
        retry_requests[request_id] = rejected

    if retry_requests:
        self._execute(http, retry_order, retry_requests)

    # Hand every result to the callbacks; a status of 300 or above is
    # delivered as an HttpError in the exception slot instead of being raised.
    for request_id in self._order:
        resp, content = self._responses[request_id]
        request = self._requests[request_id]
        callback = self._callbacks[request_id]

        response, exception = None, None
        try:
            if resp.status >= 300:
                raise HttpError(resp, content, uri=request.uri)
            response = request.postproc(resp, content)
        except HttpError as err:
            exception = err

        if callback is not None:
            callback(request_id, response, exception)
        if self._callback is not None:
            self._callback(request_id, response, exception)
John Asmuth864311d2014-04-24 15:46:08 -04001573
1574
class HttpRequestMock(object):
    """Stand-in for HttpRequest that replays a canned response.

    Do not construct directly, instead use RequestMockBuilder.
    """

    def __init__(self, resp, content, postproc):
        """Store the canned response and the post-processing callable.

        Args:
          resp: httplib2.Response, the response to emulate coming from the
            request. When None, a 200 OK response is created instead.
          content: string, the response body
          postproc: callable, the post processing function usually supplied by
            the model class. See model.JsonModel.response() as an example.
        """
        self.content = content
        self.postproc = postproc
        if resp is None:
            resp = httplib2.Response({"status": 200, "reason": "OK"})
        self.resp = resp
        # Mirror a "reason" entry onto the attribute of the same name.
        if "reason" in self.resp:
            self.resp.reason = self.resp["reason"]

    def execute(self, http=None):
        """Return postproc applied to the stored response and content.

        Same behavior as HttpRequest.execute(), but the response is
        mocked and not really from an HTTP request/response. The http
        argument is accepted and ignored.
        """
        return self.postproc(self.resp, self.content)
John Asmuth864311d2014-04-24 15:46:08 -04001605
1606
class RequestMockBuilder(object):
    """A simple mock of HttpRequest

    Pass in a dictionary to the constructor that maps request methodIds to
    tuples of (httplib2.Response, content, opt_expected_body) that should be
    returned when that method is called. None may also be passed in for the
    httplib2.Response, in which case a 200 OK response will be generated.
    If an opt_expected_body (str or dict) is provided, it will be compared to
    the body and UnexpectedBodyError will be raised on inequality. An empty
    opt_expected_body (e.g. None) means that no request body is expected.

    Example:
      response = '{"data": {"id": "tag:google.c...'
      requestBuilder = RequestMockBuilder(
        {
          'plus.activities.get': (None, response),
        }
      )
      googleapiclient.discovery.build("plus", "v1", requestBuilder=requestBuilder)

    Methods that you do not supply a response for will return a
    200 OK with an empty JSON object ("{}") as the response content or raise
    an exception if check_unexpected is set to True. The methodId is taken
    from the rpcName in the discovery document.

    For more details see the project wiki.
    """

    def __init__(self, responses, check_unexpected=False):
        """Constructor for RequestMockBuilder

        The constructed object should be a callable object
        that can replace the class HttpRequest.

        Args:
          responses: A dictionary that maps methodIds into tuples
            of (httplib2.Response, content) or
            (httplib2.Response, content, opt_expected_body). The methodId
            comes from the 'rpcName' field in the discovery document.
          check_unexpected: A boolean setting whether or not
            UnexpectedMethodError should be raised on unsupplied method.
        """
        self.responses = responses
        self.check_unexpected = check_unexpected

    def __call__(
        self,
        http,
        postproc,
        uri,
        method="GET",
        body=None,
        headers=None,
        methodId=None,
        resumable=None,
    ):
        """Implements the callable interface that discovery.build() expects
        of requestBuilder, which is to build an object compatible with
        HttpRequest.execute(). See that method for the description of the
        parameters and the expected response.

        Raises:
          UnexpectedBodyError if an expected body was registered for methodId
            and the supplied body does not match it.
          UnexpectedMethodError if methodId has no registered response and
            check_unexpected is True.
        """
        if methodId in self.responses:
            response = self.responses[methodId]
            resp, content = response[:2]
            if len(response) > 2:
                # Test the body against the supplied expected_body.
                expected_body = response[2]
                if bool(expected_body) != bool(body):
                    # Not expecting a body and provided one
                    # or expecting a body and not provided one.
                    raise UnexpectedBodyError(expected_body, body)
                # Past the check above both sides share the same truthiness.
                # When both are empty there is nothing to parse or compare;
                # calling json.loads() on None or "" would raise instead of
                # accepting the request.
                if expected_body:
                    if isinstance(expected_body, str):
                        expected_body = json.loads(expected_body)
                    body = json.loads(body)
                    if body != expected_body:
                        raise UnexpectedBodyError(expected_body, body)
            return HttpRequestMock(resp, content, postproc)
        elif self.check_unexpected:
            raise UnexpectedMethodError(methodId=methodId)
        else:
            model = JsonModel(False)
            return HttpRequestMock(None, "{}", model.response)
John Asmuth864311d2014-04-24 15:46:08 -04001687
1688
class HttpMock(object):
    """Mock of httplib2.Http"""

    def __init__(self, filename=None, headers=None):
        """Prepare the canned response.

        Args:
          filename: string, absolute filename to read response from
          headers: dict, header to return with response; defaults to
            {"status": "200"} when None.
        """
        self.response_headers = {"status": "200"} if headers is None else headers

        # The response body is the raw bytes of the file, if one was given.
        self.data = None
        if filename:
            with open(filename, "rb") as f:
                self.data = f.read()

        # Details of the most recent request(); nothing recorded yet.
        self.uri = None
        self.method = None
        self.body = None
        self.headers = None

    def request(
        self,
        uri,
        method="GET",
        body=None,
        headers=None,
        redirections=1,
        connection_type=None,
    ):
        """Record the request arguments and return the canned response."""
        self.uri, self.method = uri, method
        self.body, self.headers = body, headers
        return httplib2.Response(self.response_headers), self.data

    def close(self):
        """Do nothing; always returns None."""
        return None
John Asmuth864311d2014-04-24 15:46:08 -04001729
class HttpMockSequence(object):
    """Mock of httplib2.Http

    Mocks a sequence of calls to request returning different responses for each
    call. Create an instance initialized with the desired response headers
    and content and then use as if an httplib2.Http instance.

      http = HttpMockSequence([
        ({'status': '401'}, ''),
        ({'status': '200'}, '{"access_token":"1/3w","expires_in":3600}'),
        ({'status': '200'}, 'echo_request_headers'),
        ])
      resp, content = http.request("http://examples.com")

    There are special values you can pass in for content to trigger
    behaviours that are helpful in testing.

    'echo_request_headers' means return the request headers in the response body
    'echo_request_headers_as_json' means return the request headers, dumped
       as JSON, in the response body
    'echo_request_body' means return the request body in the response body
    'echo_request_uri' means return the request uri in the response body
    """

    def __init__(self, iterable):
        """Remember the canned responses.

        Args:
          iterable: iterable, a sequence of pairs of (headers, body). Entries
            are consumed with pop(0), one per call to request().
        """
        self._iterable = iterable
        self.follow_redirects = True
        self.request_sequence = []

    def request(
        self,
        uri,
        method="GET",
        body=None,
        headers=None,
        redirections=1,
        connection_type=None,
    ):
        """Log the request, then answer with the next canned response."""
        # Keep a record of the request so the mock can be examined afterwards.
        self.request_sequence.append((uri, method, body, headers))
        response_headers, canned = self._iterable.pop(0)
        payload = six.ensure_binary(canned)

        # Special marker values are replaced by a piece of the request.
        if payload == b"echo_request_headers":
            payload = headers
        elif payload == b"echo_request_headers_as_json":
            payload = json.dumps(headers)
        elif payload == b"echo_request_body":
            payload = body.read() if hasattr(body, "read") else body
        elif payload == b"echo_request_uri":
            payload = uri

        # Text is returned as UTF-8 bytes; anything else passes through as is.
        if isinstance(payload, six.text_type):
            payload = payload.encode("utf-8")
        return httplib2.Response(response_headers), payload
John Asmuth864311d2014-04-24 15:46:08 -04001791
1792
def set_user_agent(http, user_agent):
    """Set the user-agent on every request.

    The request method of http is replaced by a wrapper that puts user_agent
    in the "user-agent" header, in front of any value already present there,
    before delegating to the original request method.

    Args:
      http: An instance of httplib2.Http
        or something that acts like it.
      user_agent: string, the value for the user-agent header.

    Returns:
      A modified instance of http that was passed in.

    Example:

      h = httplib2.Http()
      h = set_user_agent(h, "my-app-name/6.0")

    Most of the time the user-agent will be set doing auth, this is for the rare
    cases where you are accessing an unauthenticated endpoint.
    """
    wrapped_request = http.request

    # The closure that will replace 'httplib2.Http.request'.
    def new_request(
        uri,
        method="GET",
        body=None,
        headers=None,
        redirections=httplib2.DEFAULT_MAX_REDIRECTS,
        connection_type=None,
    ):
        """Modify the request headers to add the user-agent."""
        if headers is None:
            headers = {}
        agent = user_agent
        if "user-agent" in headers:
            # Keep the caller's value, placed after ours.
            agent = user_agent + " " + headers["user-agent"]
        headers["user-agent"] = agent
        resp, content = wrapped_request(
            uri,
            method=method,
            body=body,
            headers=headers,
            redirections=redirections,
            connection_type=connection_type,
        )
        return resp, content

    http.request = new_request
    return http
John Asmuth864311d2014-04-24 15:46:08 -04001842
1843
def tunnel_patch(http):
    """Tunnel PATCH requests over POST.

    The request method of http is replaced by a wrapper that sends every
    PATCH request as a POST carrying an "x-http-method-override: PATCH"
    header. Requests using any other method are passed through unchanged.

    Args:
      http: An instance of httplib2.Http
        or something that acts like it.

    Returns:
      A modified instance of http that was passed in.

    Example:

      h = httplib2.Http()
      h = tunnel_patch(h)

    Useful if you are running on a platform that doesn't support PATCH.
    Apply this last if you are using OAuth 1.0, as changing the method
    will result in a different signature.
    """
    wrapped_request = http.request

    # The closure that will replace 'httplib2.Http.request'.
    def new_request(
        uri,
        method="GET",
        body=None,
        headers=None,
        redirections=httplib2.DEFAULT_MAX_REDIRECTS,
        connection_type=None,
    ):
        """Rewrite PATCH into POST plus a method-override header."""
        if headers is None:
            headers = {}
        if method == "PATCH":
            authorization = headers.get("authorization", "")
            if "oauth_token" in authorization:
                # Changing the method after signing alters the signature.
                LOGGER.warning(
                    "OAuth 1.0 request made with Credentials after tunnel_patch."
                )
            headers["x-http-method-override"] = "PATCH"
            method = "POST"
        resp, content = wrapped_request(
            uri,
            method=method,
            body=body,
            headers=headers,
            redirections=redirections,
            connection_type=connection_type,
        )
        return resp, content

    http.request = new_request
    return http
Igor Maravić22435292017-01-19 22:28:22 +01001895
1896
def build_http():
    """Builds httplib2.Http object

    Returns:
      A httplib2.Http object, which is used to make http requests, and which
      has timeout set by default: the socket module's default timeout when one
      is set, DEFAULT_HTTP_TIMEOUT_SEC otherwise.
      To override default timeout call

        socket.setdefaulttimeout(timeout_in_sec)

      before interacting with this method.
    """
    http_timeout = socket.getdefaulttimeout()
    if http_timeout is None:
        http_timeout = DEFAULT_HTTP_TIMEOUT_SEC

    http = httplib2.Http(timeout=http_timeout)

    # 308's are used by several Google APIs (Drive, YouTube)
    # for Resumable Uploads rather than Permanent Redirects.
    # This asks httplib2 to exclude 308s from the status codes
    # it treats as redirects
    try:
        http.redirect_codes = http.redirect_codes - {308}
    except AttributeError:
        # Apache Beam tests depend on this library and cannot
        # currently upgrade their httplib2 version
        # http.redirect_codes does not exist in previous versions
        # of httplib2, so pass
        pass

    return http