| from __future__ import absolute_import |
| |
| import email.utils |
| import mimetypes |
| import re |
| |
| from .packages import six |
| |
| |
def guess_content_type(filename, default="application/octet-stream"):
    """
    Work out the "Content-Type" for a file name.

    :param filename:
        The filename whose "Content-Type" is looked up via :mod:`mimetypes`.
        A falsy value (``None`` or an empty string) skips the lookup.
    :param default:
        The value returned when no "Content-Type" could be determined.
    """
    if not filename:
        return default

    # guess_type() yields (type, encoding); only the type is of interest.
    guessed_type, _encoding = mimetypes.guess_type(filename)
    return guessed_type or default
| |
| |
def format_header_param_rfc2231(name, value):
    """
    Format and quote one header parameter following the RFC 2231 strategy.

    Intended for header parameters that may carry non-ASCII values, such as
    file names. This follows
    `RFC 2388 Section 4.4 <https://tools.ietf.org/html/rfc2388#section-4.4>`_.

    :param name:
        The name of the parameter, a string expected to be ASCII only.
    :param value:
        The value of the parameter, provided as ``bytes`` or ``str``.
        ``bytes`` are decoded as UTF-8 first.
    :ret:
        An RFC-2231-formatted unicode string: ``name="value"`` when the value
        is plain ASCII without quotes, backslashes, CR or LF, otherwise the
        extended ``name*=...`` form.
    """
    if isinstance(value, six.binary_type):
        value = value.decode("utf-8")

    has_unsafe_char = any(ch in value for ch in '"\\\r\n')
    if not has_unsafe_char:
        simple_form = u'%s="%s"' % (name, value)
        try:
            simple_form.encode("ascii")
        except (UnicodeEncodeError, UnicodeDecodeError):
            # Not representable as ASCII: fall through to the extended form.
            pass
        else:
            return simple_form

    # encode_rfc2231 accepts an encoded string and returns an ascii-encoded
    # string in Python 2 but accepts and returns unicode strings in Python 3
    if six.PY2:  # Python 2:
        encoded = email.utils.encode_rfc2231(value.encode("utf-8"), "utf-8")
        return ("%s*=%s" % (name, encoded)).decode("utf-8")

    encoded = email.utils.encode_rfc2231(value, "utf-8")
    return "%s*=%s" % (name, encoded)
| |
| |
# Mapping of single characters to the text that replaces them when a header
# parameter value is formatted with the HTML5 strategy.
_HTML5_REPLACEMENTS = {
    # Double quote becomes its percent-encoded form.
    u"\u0022": u"%22",
    # Replace "\" with "\\".
    u"\u005C": u"\u005C\u005C",
}

# All control characters from 0x00 to 0x1F *except* 0x1B are percent-encoded
# as two upper-case hex digits.
_HTML5_REPLACEMENTS.update(
    (six.unichr(code_point), u"%{:02X}".format(code_point))
    for code_point in range(0x00, 0x1F + 1)
    if code_point != 0x1B
)
| |
| |
| def _replace_multiple(value, needles_and_replacements): |
| def replacer(match): |
| return needles_and_replacements[match.group(0)] |
| |
| pattern = re.compile( |
| r"|".join([re.escape(needle) for needle in needles_and_replacements.keys()]) |
| ) |
| |
| result = pattern.sub(replacer, value) |
| |
| return result |
| |
| |
def format_header_param_html5(name, value):
    """
    Format and quote one header parameter following the HTML5 strategy.

    Intended for header parameters that may carry non-ASCII values, such as
    file names. This follows the `HTML5 Working Draft
    Section 4.10.22.7`_ and matches the behavior of curl and modern browsers.

    .. _HTML5 Working Draft Section 4.10.22.7:
        https://w3c.github.io/html/sec-forms.html#multipart-form-data

    :param name:
        The name of the parameter, a string expected to be ASCII only.
    :param value:
        The value of the parameter, provided as ``bytes`` or ``str``.
        ``bytes`` are decoded as UTF-8 first.
    :ret:
        A unicode string of the form ``name="value"`` with the characters
        listed in ``_HTML5_REPLACEMENTS`` substituted.
    """
    text = value.decode("utf-8") if isinstance(value, six.binary_type) else value
    escaped = _replace_multiple(text, _HTML5_REPLACEMENTS)
    return u'%s="%s"' % (name, escaped)
| |
| |
| # Kept for backwards-compatibility: the generic name ``format_header_param`` |
| # is bound to the HTML5 formatter. |
| format_header_param = format_header_param_html5 |
| |
| |
class RequestField(object):
    """
    Container holding one parameter of a request body.

    :param name:
        The name of this request field. Must be unicode.
    :param data:
        The data/value body.
    :param filename:
        An optional filename of the request field. Must be unicode.
    :param headers:
        An optional dict-like object of headers to start with. A truthy value
        is copied into a new :class:`dict`.
    :param header_formatter:
        An optional callable used to encode and format the header parameters.
        Defaults to :func:`format_header_param_html5`.
    """

    def __init__(
        self,
        name,
        data,
        filename=None,
        headers=None,
        header_formatter=format_header_param_html5,
    ):
        self._name = name
        self._filename = filename
        self.data = data
        # Copy so the field never shares its header dict with the caller.
        self.headers = dict(headers) if headers else {}
        self.header_formatter = header_formatter

    @classmethod
    def from_tuples(cls, fieldname, value, header_formatter=format_header_param_html5):
        """
        Build a :class:`~urllib3.fields.RequestField` from old-style tuple parameters.

        ``value`` is either a plain value or a filetuple. A filetuple is a
        (filename, data, MIME type) tuple where the MIME type is optional;
        when it is left out, the type is guessed from the filename.
        For example::

            'foo': 'bar',
            'fakefile': ('foofile.txt', 'contents of foofile'),
            'realfile': ('barfile.txt', open('realfile').read()),
            'typedfile': ('bazfile.bin', open('bazfile').read(), 'image/jpeg'),
            'nonamefile': 'contents of nonamefile field',

        Field names and filenames must be unicode.
        """
        # Defaults describe the plain (non-tuple) case.
        filename = None
        content_type = None
        data = value

        if isinstance(value, tuple):
            if len(value) == 3:
                filename, data, content_type = value
            else:
                filename, data = value
                content_type = guess_content_type(filename)

        field = cls(
            fieldname, data, filename=filename, header_formatter=header_formatter
        )
        field.make_multipart(content_type=content_type)
        return field

    def _render_part(self, name, value):
        """
        Overridable hook that formats a single header parameter by
        delegating to ``self.header_formatter``.

        :param name:
            The name of the parameter, a string expected to be ASCII only.
        :param value:
            The value of the parameter, provided as a unicode string.
        """
        formatter = self.header_formatter
        return formatter(name, value)

    def _render_parts(self, header_parts):
        """
        Format and quote the parameters of a single header.

        Useful for single headers that are composed of multiple items. E.g.,
        'Content-Disposition' fields.

        :param header_parts:
            A sequence of (k, v) tuples or a :class:`dict` of (k, v) to format
            as `k1="v1"; k2="v2"; ...`. Pairs whose value is ``None`` are
            left out.
        """
        if isinstance(header_parts, dict):
            pairs = header_parts.items()
        else:
            pairs = header_parts

        rendered = [
            self._render_part(key, val) for key, val in pairs if val is not None
        ]
        return u"; ".join(rendered)

    def render_headers(self):
        """
        Render this field's headers as a single CRLF-separated string.

        "Content-Disposition", "Content-Type" and "Content-Location" come
        first, in that order; the remaining headers follow. Headers with a
        falsy value are omitted.
        """
        leading = ["Content-Disposition", "Content-Type", "Content-Location"]

        rendered = [
            u"%s: %s" % (key, self.headers[key])
            for key in leading
            if self.headers.get(key, False)
        ]
        rendered.extend(
            u"%s: %s" % (key, val)
            for key, val in self.headers.items()
            if key not in leading and val
        )

        rendered.append(u"\r\n")
        return u"\r\n".join(rendered)

    def make_multipart(
        self, content_disposition=None, content_type=None, content_location=None
    ):
        """
        Turn this request field into a multipart request field.

        This method overwrites the "Content-Disposition", "Content-Type" and
        "Content-Location" headers of the request parameter.

        :param content_disposition:
            The leading 'Content-Disposition' value; a falsy value means
            ``form-data``. The field's name and filename parameters are
            appended to it.
        :param content_type:
            The 'Content-Type' of the request body.
        :param content_location:
            The 'Content-Location' of the request body.

        """
        self.headers["Content-Disposition"] = content_disposition or u"form-data"
        disposition_params = self._render_parts(
            ((u"name", self._name), (u"filename", self._filename))
        )
        self.headers["Content-Disposition"] += u"; " + disposition_params
        self.headers["Content-Type"] = content_type
        self.headers["Content-Location"] = content_location