mirror of
				https://github.com/django/django.git
				synced 2025-10-25 06:36:07 +00:00 
			
		
		
		
	Fixed #10190 -- Made HttpResponse charset customizable.
Thanks to Simon Charette, Aymeric Augustin, and Tim Graham for reviews and contributions.
This commit is contained in:
		
				
					committed by
					
						 Tim Graham
						Tim Graham
					
				
			
			
				
	
			
			
			
						parent
						
							9d6551204e
						
					
				
				
					commit
					5f2542f12a
				
			| @@ -2,6 +2,7 @@ from __future__ import unicode_literals | |||||||
|  |  | ||||||
| import datetime | import datetime | ||||||
| import json | import json | ||||||
|  | import re | ||||||
| import sys | import sys | ||||||
| import time | import time | ||||||
| from email.header import Header | from email.header import Header | ||||||
| @@ -83,6 +84,9 @@ REASON_PHRASES = { | |||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
|  | _charset_from_content_type_re = re.compile(r';\s*charset=(?P<charset>[^\s;]+)', re.I) | ||||||
|  |  | ||||||
|  |  | ||||||
| class BadHeaderError(ValueError): | class BadHeaderError(ValueError): | ||||||
|     pass |     pass | ||||||
|  |  | ||||||
| @@ -98,19 +102,15 @@ class HttpResponseBase(six.Iterator): | |||||||
|     status_code = 200 |     status_code = 200 | ||||||
|     reason_phrase = None        # Use default reason phrase for status code. |     reason_phrase = None        # Use default reason phrase for status code. | ||||||
|  |  | ||||||
|     def __init__(self, content_type=None, status=None, reason=None): |     def __init__(self, content_type=None, status=None, reason=None, charset=None): | ||||||
|         # _headers is a mapping of the lower-case name to the original case of |         # _headers is a mapping of the lower-case name to the original case of | ||||||
|         # the header (required for working with legacy systems) and the header |         # the header (required for working with legacy systems) and the header | ||||||
|         # value. Both the name of the header and its value are ASCII strings. |         # value. Both the name of the header and its value are ASCII strings. | ||||||
|         self._headers = {} |         self._headers = {} | ||||||
|         self._charset = settings.DEFAULT_CHARSET |  | ||||||
|         self._closable_objects = [] |         self._closable_objects = [] | ||||||
|         # This parameter is set by the handler. It's necessary to preserve the |         # This parameter is set by the handler. It's necessary to preserve the | ||||||
|         # historical behavior of request_finished. |         # historical behavior of request_finished. | ||||||
|         self._handler_class = None |         self._handler_class = None | ||||||
|         if not content_type: |  | ||||||
|             content_type = "%s; charset=%s" % (settings.DEFAULT_CONTENT_TYPE, |  | ||||||
|                     self._charset) |  | ||||||
|         self.cookies = SimpleCookie() |         self.cookies = SimpleCookie() | ||||||
|         if status is not None: |         if status is not None: | ||||||
|             self.status_code = status |             self.status_code = status | ||||||
| @@ -119,8 +119,27 @@ class HttpResponseBase(six.Iterator): | |||||||
|         elif self.reason_phrase is None: |         elif self.reason_phrase is None: | ||||||
|             self.reason_phrase = REASON_PHRASES.get(self.status_code, |             self.reason_phrase = REASON_PHRASES.get(self.status_code, | ||||||
|                                                     'UNKNOWN STATUS CODE') |                                                     'UNKNOWN STATUS CODE') | ||||||
|  |         self._charset = charset | ||||||
|  |         if content_type is None: | ||||||
|  |             content_type = '%s; charset=%s' % (settings.DEFAULT_CONTENT_TYPE, | ||||||
|  |                                                self.charset) | ||||||
|         self['Content-Type'] = content_type |         self['Content-Type'] = content_type | ||||||
|  |  | ||||||
|  |     @property | ||||||
|  |     def charset(self): | ||||||
|  |         if self._charset is not None: | ||||||
|  |             return self._charset | ||||||
|  |         content_type = self.get('Content-Type', '') | ||||||
|  |         matched = _charset_from_content_type_re.search(content_type) | ||||||
|  |         if matched: | ||||||
|  |             # Extract the charset and strip its double quotes | ||||||
|  |             return matched.group('charset').replace('"', '') | ||||||
|  |         return settings.DEFAULT_CHARSET | ||||||
|  |  | ||||||
|  |     @charset.setter | ||||||
|  |     def charset(self, value): | ||||||
|  |         self._charset = value | ||||||
|  |  | ||||||
|     def serialize_headers(self): |     def serialize_headers(self): | ||||||
|         """HTTP headers as a bytestring.""" |         """HTTP headers as a bytestring.""" | ||||||
|         def to_bytes(val, encoding): |         def to_bytes(val, encoding): | ||||||
| @@ -278,10 +297,10 @@ class HttpResponseBase(six.Iterator): | |||||||
|         if isinstance(value, bytes): |         if isinstance(value, bytes): | ||||||
|             return bytes(value) |             return bytes(value) | ||||||
|         if isinstance(value, six.text_type): |         if isinstance(value, six.text_type): | ||||||
|             return bytes(value.encode(self._charset)) |             return bytes(value.encode(self.charset)) | ||||||
|  |  | ||||||
|         # Handle non-string types (#16494) |         # Handle non-string types (#16494) | ||||||
|         return force_bytes(value, self._charset) |         return force_bytes(value, self.charset) | ||||||
|  |  | ||||||
|     # These methods partially implement the file-like object interface. |     # These methods partially implement the file-like object interface. | ||||||
|     # See http://docs.python.org/lib/bltin-file-objects.html |     # See http://docs.python.org/lib/bltin-file-objects.html | ||||||
|   | |||||||
| @@ -10,7 +10,8 @@ class ContentNotRenderedError(Exception): | |||||||
| class SimpleTemplateResponse(HttpResponse): | class SimpleTemplateResponse(HttpResponse): | ||||||
|     rendering_attrs = ['template_name', 'context_data', '_post_render_callbacks'] |     rendering_attrs = ['template_name', 'context_data', '_post_render_callbacks'] | ||||||
|  |  | ||||||
|     def __init__(self, template, context=None, content_type=None, status=None): |     def __init__(self, template, context=None, content_type=None, status=None, | ||||||
|  |                  charset=None): | ||||||
|         # It would seem obvious to call these next two members 'template' and |         # It would seem obvious to call these next two members 'template' and | ||||||
|         # 'context', but those names are reserved as part of the test Client |         # 'context', but those names are reserved as part of the test Client | ||||||
|         # API. To avoid the name collision, we use tricky-to-debug problems |         # API. To avoid the name collision, we use tricky-to-debug problems | ||||||
| @@ -22,7 +23,7 @@ class SimpleTemplateResponse(HttpResponse): | |||||||
|         # content argument doesn't make sense here because it will be replaced |         # content argument doesn't make sense here because it will be replaced | ||||||
|         # with rendered template so we always pass empty string in order to |         # with rendered template so we always pass empty string in order to | ||||||
|         # prevent errors and provide shorter signature. |         # prevent errors and provide shorter signature. | ||||||
|         super(SimpleTemplateResponse, self).__init__('', content_type, status) |         super(SimpleTemplateResponse, self).__init__('', content_type, status, charset) | ||||||
|  |  | ||||||
|         # _is_rendered tracks whether the template and context has been baked |         # _is_rendered tracks whether the template and context has been baked | ||||||
|         # into a final response. |         # into a final response. | ||||||
| @@ -136,7 +137,7 @@ class TemplateResponse(SimpleTemplateResponse): | |||||||
|     rendering_attrs = SimpleTemplateResponse.rendering_attrs + ['_request', '_current_app'] |     rendering_attrs = SimpleTemplateResponse.rendering_attrs + ['_request', '_current_app'] | ||||||
|  |  | ||||||
|     def __init__(self, request, template, context=None, content_type=None, |     def __init__(self, request, template, context=None, content_type=None, | ||||||
|             status=None, current_app=None): |             status=None, current_app=None, charset=None): | ||||||
|         # self.request gets over-written by django.test.client.Client - and |         # self.request gets over-written by django.test.client.Client - and | ||||||
|         # unlike context_data and template_name the _request should not |         # unlike context_data and template_name the _request should not | ||||||
|         # be considered part of the public API. |         # be considered part of the public API. | ||||||
| @@ -145,7 +146,7 @@ class TemplateResponse(SimpleTemplateResponse): | |||||||
|         # having to avoid needing to create the RequestContext directly |         # having to avoid needing to create the RequestContext directly | ||||||
|         self._current_app = current_app |         self._current_app = current_app | ||||||
|         super(TemplateResponse, self).__init__( |         super(TemplateResponse, self).__init__( | ||||||
|             template, context, content_type, status) |             template, context, content_type, status, charset) | ||||||
|  |  | ||||||
|     def resolve_context(self, context): |     def resolve_context(self, context): | ||||||
|         """Convert context data into a full RequestContext object |         """Convert context data into a full RequestContext object | ||||||
|   | |||||||
| @@ -327,8 +327,8 @@ class SimpleTestCase(unittest.TestCase): | |||||||
|         else: |         else: | ||||||
|             content = response.content |             content = response.content | ||||||
|         if not isinstance(text, bytes) or html: |         if not isinstance(text, bytes) or html: | ||||||
|             text = force_text(text, encoding=response._charset) |             text = force_text(text, encoding=response.charset) | ||||||
|             content = content.decode(response._charset) |             content = content.decode(response.charset) | ||||||
|             text_repr = "'%s'" % text |             text_repr = "'%s'" % text | ||||||
|         else: |         else: | ||||||
|             text_repr = repr(text) |             text_repr = repr(text) | ||||||
|   | |||||||
| @@ -627,6 +627,15 @@ Attributes | |||||||
|     A bytestring representing the content, encoded from a Unicode |     A bytestring representing the content, encoded from a Unicode | ||||||
|     object if necessary. |     object if necessary. | ||||||
|  |  | ||||||
|  | .. attribute:: HttpResponse.charset | ||||||
|  |  | ||||||
|  |     .. versionadded:: 1.8 | ||||||
|  |  | ||||||
|  |     A string denoting the charset in which the response will be encoded. If not | ||||||
|  |     given at ``HttpResponse`` instantiation time, it will be extracted from | ||||||
|  |     ``content_type`` and if that is unsuccessful, the | ||||||
|  |     :setting:`DEFAULT_CHARSET` setting will be used. | ||||||
|  |  | ||||||
| .. attribute:: HttpResponse.status_code | .. attribute:: HttpResponse.status_code | ||||||
|  |  | ||||||
|     The `HTTP status code`_ for the response. |     The `HTTP status code`_ for the response. | ||||||
| @@ -645,7 +654,7 @@ Attributes | |||||||
| Methods | Methods | ||||||
| ------- | ------- | ||||||
|  |  | ||||||
| .. method:: HttpResponse.__init__(content='', content_type=None, status=200, reason=None) | .. method:: HttpResponse.__init__(content='', content_type=None, status=200, reason=None, charset=None) | ||||||
|  |  | ||||||
|     Instantiates an ``HttpResponse`` object with the given page content and |     Instantiates an ``HttpResponse`` object with the given page content and | ||||||
|     content type. |     content type. | ||||||
| @@ -666,6 +675,14 @@ Methods | |||||||
|     ``reason`` is the HTTP response phrase. If not provided, a default phrase |     ``reason`` is the HTTP response phrase. If not provided, a default phrase | ||||||
|     will be used. |     will be used. | ||||||
|  |  | ||||||
|  |     ``charset`` is the charset in which the response will be encoded. If not | ||||||
|  |     given it will be extracted from ``content_type``, and if that | ||||||
|  |     is unsuccessful, the :setting:`DEFAULT_CHARSET` setting will be used. | ||||||
|  |  | ||||||
|  |     .. versionadded:: 1.8 | ||||||
|  |  | ||||||
|  |         The ``charset`` parameter was added. | ||||||
|  |  | ||||||
| .. method:: HttpResponse.__setitem__(header, value) | .. method:: HttpResponse.__setitem__(header, value) | ||||||
|  |  | ||||||
|     Sets the given header name to the given value. Both ``header`` and |     Sets the given header name to the given value. Both ``header`` and | ||||||
|   | |||||||
| @@ -56,7 +56,7 @@ Attributes | |||||||
| Methods | Methods | ||||||
| ------- | ------- | ||||||
|  |  | ||||||
| .. method:: SimpleTemplateResponse.__init__(template, context=None, content_type=None, status=None) | .. method:: SimpleTemplateResponse.__init__(template, context=None, content_type=None, status=None, charset=None) | ||||||
|  |  | ||||||
|     Instantiates a |     Instantiates a | ||||||
|     :class:`~django.template.response.SimpleTemplateResponse` object |     :class:`~django.template.response.SimpleTemplateResponse` object | ||||||
| @@ -80,6 +80,15 @@ Methods | |||||||
|         ``content_type`` is specified, then its value is used. Otherwise, |         ``content_type`` is specified, then its value is used. Otherwise, | ||||||
|         :setting:`DEFAULT_CONTENT_TYPE` is used. |         :setting:`DEFAULT_CONTENT_TYPE` is used. | ||||||
|  |  | ||||||
|  |     ``charset`` | ||||||
|  |         The charset in which the response will be encoded. If not given it will | ||||||
|  |         be extracted from ``content_type``, and if that is unsuccessful, the | ||||||
|  |         :setting:`DEFAULT_CHARSET` setting will be used. | ||||||
|  |  | ||||||
|  |     .. versionadded:: 1.8 | ||||||
|  |  | ||||||
|  |         The ``charset`` parameter was added. | ||||||
|  |  | ||||||
| .. method:: SimpleTemplateResponse.resolve_context(context) | .. method:: SimpleTemplateResponse.resolve_context(context) | ||||||
|  |  | ||||||
|     Converts context data into a context instance that can be used for |     Converts context data into a context instance that can be used for | ||||||
| @@ -140,7 +149,7 @@ TemplateResponse objects | |||||||
| Methods | Methods | ||||||
| ------- | ------- | ||||||
|  |  | ||||||
| .. method:: TemplateResponse.__init__(request, template, context=None, content_type=None, status=None, current_app=None) | .. method:: TemplateResponse.__init__(request, template, context=None, content_type=None, status=None, current_app=None, charset=None) | ||||||
|  |  | ||||||
|     Instantiates an ``TemplateResponse`` object with the given |     Instantiates an ``TemplateResponse`` object with the given | ||||||
|     template, context, MIME type and HTTP status. |     template, context, MIME type and HTTP status. | ||||||
| @@ -173,6 +182,14 @@ Methods | |||||||
|         :ref:`namespaced URL resolution strategy <topics-http-reversing-url-namespaces>` |         :ref:`namespaced URL resolution strategy <topics-http-reversing-url-namespaces>` | ||||||
|         for more information. |         for more information. | ||||||
|  |  | ||||||
|  |     ``charset`` | ||||||
|  |         The charset in which the response will be encoded. If not given it will | ||||||
|  |         be extracted from ``content_type``, and if that is unsuccessful, the | ||||||
|  |         :setting:`DEFAULT_CHARSET` setting will be used. | ||||||
|  |  | ||||||
|  |     .. versionadded:: 1.8 | ||||||
|  |  | ||||||
|  |         The ``charset`` parameter was added. | ||||||
|  |  | ||||||
| The rendering process | The rendering process | ||||||
| ===================== | ===================== | ||||||
|   | |||||||
| @@ -278,6 +278,9 @@ Requests and Responses | |||||||
|   This brings this class into line with the documentation and with |   This brings this class into line with the documentation and with | ||||||
|   ``WSGIRequest``. |   ``WSGIRequest``. | ||||||
|  |  | ||||||
|  | * The :attr:`HttpResponse.charset <django.http.HttpResponse.charset>` attribute | ||||||
|  |   was added. | ||||||
|  |  | ||||||
| Tests | Tests | ||||||
| ^^^^^ | ^^^^^ | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,8 +1,16 @@ | |||||||
|  | # -*- coding: utf-8 -*- | ||||||
|  |  | ||||||
|  | from __future__ import unicode_literals | ||||||
|  |  | ||||||
|  | from django.conf import settings | ||||||
| from django.http import HttpResponse | from django.http import HttpResponse | ||||||
| import unittest | from django.test import SimpleTestCase | ||||||
|  |  | ||||||
|  | UTF8 = 'utf-8' | ||||||
|  | ISO88591 = 'iso-8859-1' | ||||||
|  |  | ||||||
|  |  | ||||||
| class HttpResponseTests(unittest.TestCase): | class HttpResponseTests(SimpleTestCase): | ||||||
|  |  | ||||||
|     def test_status_code(self): |     def test_status_code(self): | ||||||
|         resp = HttpResponse(status=418) |         resp = HttpResponse(status=418) | ||||||
| @@ -14,3 +22,45 @@ class HttpResponseTests(unittest.TestCase): | |||||||
|         resp = HttpResponse(status=814, reason=reason) |         resp = HttpResponse(status=814, reason=reason) | ||||||
|         self.assertEqual(resp.status_code, 814) |         self.assertEqual(resp.status_code, 814) | ||||||
|         self.assertEqual(resp.reason_phrase, reason) |         self.assertEqual(resp.reason_phrase, reason) | ||||||
|  |  | ||||||
|  |     def test_charset_detection(self): | ||||||
|  |         """ HttpResponse should parse charset from content_type.""" | ||||||
|  |         response = HttpResponse('ok') | ||||||
|  |         self.assertEqual(response.charset, settings.DEFAULT_CHARSET) | ||||||
|  |  | ||||||
|  |         response = HttpResponse(charset=ISO88591) | ||||||
|  |         self.assertEqual(response.charset, ISO88591) | ||||||
|  |         self.assertEqual(response['Content-Type'], 'text/html; charset=%s' % ISO88591) | ||||||
|  |  | ||||||
|  |         response = HttpResponse(content_type='text/plain; charset=%s' % UTF8, charset=ISO88591) | ||||||
|  |         self.assertEqual(response.charset, ISO88591) | ||||||
|  |  | ||||||
|  |         response = HttpResponse(content_type='text/plain; charset=%s' % ISO88591) | ||||||
|  |         self.assertEqual(response.charset, ISO88591) | ||||||
|  |  | ||||||
|  |         response = HttpResponse(content_type='text/plain; charset="%s"' % ISO88591) | ||||||
|  |         self.assertEqual(response.charset, ISO88591) | ||||||
|  |  | ||||||
|  |         response = HttpResponse(content_type='text/plain; charset=') | ||||||
|  |         self.assertEqual(response.charset, settings.DEFAULT_CHARSET) | ||||||
|  |  | ||||||
|  |         response = HttpResponse(content_type='text/plain') | ||||||
|  |         self.assertEqual(response.charset, settings.DEFAULT_CHARSET) | ||||||
|  |  | ||||||
|  |     def test_response_content_charset(self): | ||||||
|  |         """HttpResponse should encode based on charset.""" | ||||||
|  |         content = "Café :)" | ||||||
|  |         utf8_content = content.encode(UTF8) | ||||||
|  |         iso_content = content.encode(ISO88591) | ||||||
|  |  | ||||||
|  |         response = HttpResponse(utf8_content) | ||||||
|  |         self.assertContains(response, utf8_content) | ||||||
|  |  | ||||||
|  |         response = HttpResponse(iso_content, content_type='text/plain; charset=%s' % ISO88591) | ||||||
|  |         self.assertContains(response, iso_content) | ||||||
|  |  | ||||||
|  |         response = HttpResponse(iso_content) | ||||||
|  |         self.assertContains(response, iso_content) | ||||||
|  |  | ||||||
|  |         response = HttpResponse(iso_content, content_type='text/plain') | ||||||
|  |         self.assertContains(response, iso_content) | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user