http.py 5.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144
  1. # -*- coding: utf-8 -*-
  2. """
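oss2.http
~~~~~~~~~

This module contains the HTTP adapters. Although the OSS Python SDK uses the
requests library internally for HTTP communication, this is transparent to
users. The `Session`, `Request` and `Response` classes in this module are thin
wrappers around the corresponding requests classes.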
  7. """
  8. import platform
  9. import requests
  10. from requests.structures import CaseInsensitiveDict
  11. from . import __version__, defaults
  12. from .compat import to_bytes
  13. from .exceptions import RequestError
  14. from .utils import file_object_remaining_bytes, SizedFileAdapter
  15. import logging
  16. USER_AGENT = 'aliyun-sdk-python/{0}({1}/{2}/{3};{4})'.format(
  17. __version__, platform.system(), platform.release(), platform.machine(), platform.python_version())
  18. logger = logging.getLogger(__name__)
  19. class Session(object):
  20. """属于同一个Session的请求共享一组连接池,如有可能也会重用HTTP连接。"""
  21. def __init__(self):
  22. self.session = requests.Session()
  23. psize = defaults.connection_pool_size
  24. self.session.mount('http://', requests.adapters.HTTPAdapter(pool_connections=psize, pool_maxsize=psize))
  25. self.session.mount('https://', requests.adapters.HTTPAdapter(pool_connections=psize, pool_maxsize=psize))
  26. def do_request(self, req, timeout):
  27. try:
  28. logger.debug("Send request, method: {0}, url: {1}, params: {2}, headers: {3}, timeout: {4}".format(
  29. req.method, req.url, req.params, req.headers, timeout))
  30. return Response(self.session.request(req.method, req.url,
  31. data=req.data,
  32. params=req.params,
  33. headers=req.headers,
  34. stream=True,
  35. timeout=timeout))
  36. except requests.RequestException as e:
  37. raise RequestError(e)
  38. class Request(object):
  39. def __init__(self, method, url,
  40. data=None,
  41. params=None,
  42. headers=None,
  43. app_name=''):
  44. self.method = method
  45. self.url = url
  46. self.data = _convert_request_body(data)
  47. self.params = params or {}
  48. if not isinstance(headers, CaseInsensitiveDict):
  49. self.headers = CaseInsensitiveDict(headers)
  50. else:
  51. self.headers = headers
  52. # tell requests not to add 'Accept-Encoding: gzip, deflate' by default
  53. if 'Accept-Encoding' not in self.headers:
  54. self.headers['Accept-Encoding'] = None
  55. if 'User-Agent' not in self.headers:
  56. if app_name:
  57. self.headers['User-Agent'] = USER_AGENT + '/' + app_name
  58. else:
  59. self.headers['User-Agent'] = USER_AGENT
  60. logger.debug("Init request, method: {0}, url: {1}, params: {2}, headers: {3}".format(method, url, params,
  61. headers))
  62. _CHUNK_SIZE = 8 * 1024
  63. class Response(object):
  64. def __init__(self, response):
  65. self.response = response
  66. self.status = response.status_code
  67. self.headers = response.headers
  68. self.request_id = response.headers.get('x-oss-request-id', '')
  69. # When a response contains no body, iter_content() cannot
  70. # be run twice (requests.exceptions.StreamConsumedError will be raised).
  71. # For details of the issue, please see issue #82
  72. #
  73. # To work around this issue, we simply return b'' when everything has been read.
  74. #
  75. # Note you cannot use self.response.raw.read() to implement self.read(), because
  76. # raw.read() does not uncompress response body when the encoding is gzip etc., and
  77. # we try to avoid depends on details of self.response.raw.
  78. self.__all_read = False
  79. logger.debug("Get response headers, req-id:{0}, status: {1}, headers: {2}".format(self.request_id, self.status,
  80. self.headers))
  81. def read(self, amt=None):
  82. if self.__all_read:
  83. return b''
  84. if amt is None:
  85. content_list = []
  86. for chunk in self.response.iter_content(_CHUNK_SIZE):
  87. content_list.append(chunk)
  88. content = b''.join(content_list)
  89. self.__all_read = True
  90. return content
  91. else:
  92. try:
  93. return next(self.response.iter_content(amt))
  94. except StopIteration:
  95. self.__all_read = True
  96. return b''
  97. def __iter__(self):
  98. return self.response.iter_content(_CHUNK_SIZE)
  99. # requests对于具有fileno()方法的file object,会用fileno()的返回值作为Content-Length。
  100. # 这对于已经读取了部分内容,或执行了seek()的file object是不正确的。
  101. #
  102. # _convert_request_body()对于支持seek()和tell() file object,确保是从
  103. # 当前位置读取,且只读取当前位置到文件结束的内容。
  104. def _convert_request_body(data):
  105. data = to_bytes(data)
  106. if hasattr(data, '__len__'):
  107. return data
  108. if hasattr(data, 'seek') and hasattr(data, 'tell'):
  109. return SizedFileAdapter(data, file_object_remaining_bytes(data))
  110. return data