{
  "instance_id": "django__django-15347",
  "repo": "django/django",
  "created_at": "2022-01-22T01:56:48Z",
  "problem_statement": "Messages framework incorrectly serializes/deserializes extra_tags when it's an empty string\nDescription\n\t\nWhen a message is serialised and then deserialised with any of the built in storage backends, then extra_tags==\"\" is converted to extra_tags==None. This is because MessageEncoder checks for the truthyness of extra_tags rather than checking it is not None.\nTo replicate this bug\n>>> from django.conf import settings\n>>> settings.configure() # Just to allow the following import\n>>> from django.contrib.messages.storage.base import Message\n>>> from django.contrib.messages.storage.cookie import MessageEncoder, MessageDecoder\n>>> original_message = Message(10, \"Here is a message\", extra_tags=\"\")\n>>> encoded_message = MessageEncoder().encode(original_message)\n>>> decoded_message = MessageDecoder().decode(encoded_message)\n>>> original_message.extra_tags == \"\"\nTrue\n>>> decoded_message.extra_tags is None\nTrue\nEffect of the bug in application behaviour\nThis error occurred in the wild with a template tag similar to the following:\n{% if x not in message.extra_tags %}\nWhen the message was displayed as part of a redirect, it had been serialised and deserialized which meant that extra_tags was None instead of the empty string. This caused an error.\nIt's important to note that this bug affects all of the standard API (messages.debug, messages.info etc. all have a default value of extra_tags equal to \"\").\n",
  "patch": "diff --git a/django/contrib/messages/storage/cookie.py b/django/contrib/messages/storage/cookie.py\n--- a/django/contrib/messages/storage/cookie.py\n+++ b/django/contrib/messages/storage/cookie.py\n@@ -19,7 +19,7 @@ def default(self, obj):\n             # Using 0/1 here instead of False/True to produce more compact json\n             is_safedata = 1 if isinstance(obj.message, SafeData) else 0\n             message = [self.message_key, is_safedata, obj.level, obj.message]\n-            if obj.extra_tags:\n+            if obj.extra_tags is not None:\n                 message.append(obj.extra_tags)\n             return message\n         return super().default(obj)\n",
  "similar_bug_items": [
    {
      "pr_number": 6540,
      "pr_title": "Fixed #26341 (again) -- Addressed multiple occurrences per line use case",
      "pr_body": "",
      "issue_id": 26341,
      "issue_title": "Weird comments in PO files (.html.py filenames)",
      "issue_body": "",
      "issue_closed_at": "2016-04-30T05:07:43",
      "base_commit": "4e2ee8662753ca6a2619039b903f11c60709f398",
      "changes": [
        {
          "file": "django/core/management/commands/makemessages.py",
          "type": "function",
          "name": "postprocess_messages",
          "class_name": "BuildFile",
          "code": "def postprocess_messages(self, msgs):\n        \"\"\"\n        Postprocess messages generated by xgettext GNU gettext utility.\n\n        Transform paths as if these messages were generated from original\n        translatable files rather than from preprocessed versions.\n        \"\"\"\n        if not self.is_templatized:\n            return msgs\n\n        # Remove '.py' suffix\n        if os.name == 'nt':\n            # Preserve '.\\' prefix on Windows to respect gettext behavior\n            old_path = self.work_path\n            new_path = self.path\n        else:\n            old_path = self.work_path[2:]\n            new_path = self.path[2:]\n\n        return re.sub(\n            r'^(#: .*)(' + re.escape(old_path) + r')',\n            r'\\1' + new_path,\n            msgs,\n            flags=re.MULTILINE\n        )"
        }
      ]
    },
    {
      "pr_number": 12263,
      "pr_title": "Fixed #31166 -- Used \"raise from\" when raising ImproperlyConfigured exceptions in django.urls.resolvers.",
      "pr_body": "This will make it have a text of \"this exception is the direct result of\" instead of \"During handling of the above exception, another exception occurred\" \r\n\r\nThis is more accurate for the case of this exception.",
      "issue_id": 31166,
      "issue_title": "Provide context for ImproperlyConfigured exceptions in URL resolver.",
      "issue_body": "",
      "issue_closed_at": "2020-01-17T05:21:04",
      "base_commit": "73563183c2ea92e9ef1d3a1f790a503acc14ade2",
      "changes": [
        {
          "file": "django/urls/resolvers.py",
          "type": "function",
          "name": "_compile",
          "class_name": "RoutePattern",
          "code": "def _compile(self, route):\n        return re.compile(_route_to_regex(route, self._is_endpoint)[0])"
        },
        {
          "file": "django/urls/resolvers.py",
          "type": "function",
          "name": "_route_to_regex",
          "class_name": null,
          "code": "def _route_to_regex(route, is_endpoint=False):\n    \"\"\"\n    Convert a path pattern into a regular expression. Return the regular\n    expression and a dictionary mapping the capture names to the converters.\n    For example, 'foo/<int:pk>' returns '^foo\\\\/(?P<pk>[0-9]+)'\n    and {'pk': <django.urls.converters.IntConverter>}.\n    \"\"\"\n    if not set(route).isdisjoint(string.whitespace):\n        raise ImproperlyConfigured(\"URL route '%s' cannot contain whitespace.\" % route)\n    original_route = route\n    parts = ['^']\n    converters = {}\n    while True:\n        match = _PATH_PARAMETER_COMPONENT_RE.search(route)\n        if not match:\n            parts.append(re.escape(route))\n            break\n        parts.append(re.escape(route[:match.start()]))\n        route = route[match.end():]\n        parameter = match.group('parameter')\n        if not parameter.isidentifier():\n            raise ImproperlyConfigured(\n                \"URL route '%s' uses parameter name %r which isn't a valid \"\n                \"Python identifier.\" % (original_route, parameter)\n            )\n        raw_converter = match.group('converter')\n        if raw_converter is None:\n            # If a converter isn't specified, the default is `str`.\n            raw_converter = 'str'\n        try:\n            converter = get_converter(raw_converter)\n        except KeyError as e:\n            raise ImproperlyConfigured(\n                \"URL route '%s' uses invalid converter %s.\" % (original_route, e)\n            )\n        converters[parameter] = converter\n        parts.append('(?P<' + parameter + '>' + converter.regex + ')')\n    if is_endpoint:\n        parts.append('$')\n    return ''.join(parts), converters"
        },
        {
          "file": "django/urls/resolvers.py",
          "type": "function",
          "name": "url_patterns",
          "class_name": "URLResolver",
          "code": "def url_patterns(self):\n        # urlconf_module might be a valid set of patterns, so we default to it\n        patterns = getattr(self.urlconf_module, \"urlpatterns\", self.urlconf_module)\n        try:\n            iter(patterns)\n        except TypeError:\n            msg = (\n                \"The included URLconf '{name}' does not appear to have any \"\n                \"patterns in it. If you see valid patterns in the file then \"\n                \"the issue is probably caused by a circular import.\"\n            )\n            raise ImproperlyConfigured(msg.format(name=self.urlconf_name))\n        return patterns"
        }
      ]
    },
    {
      "pr_number": 9112,
      "pr_title": "Fixed #27846 -- clear all cached reverse relationships on refresh_from_db()",
      "pr_body": "https://code.djangoproject.com/ticket/27846",
      "issue_id": 27846,
      "issue_title": "refresh_from_db() doesn't clear reverse OneToOneFields",
      "issue_body": "",
      "issue_closed_at": "2017-10-12T16:25:22",
      "base_commit": "df0aebc893973c78d7d2cda712ba4133dbe29b6e",
      "changes": [
        {
          "file": "django/db/models/base.py",
          "type": "function",
          "name": "refresh_from_db",
          "class_name": "Model",
          "code": "def refresh_from_db(self, using=None, fields=None):\n        \"\"\"\n        Reload field values from the database.\n\n        By default, the reloading happens from the database this instance was\n        loaded from, or by the read router if this instance wasn't loaded from\n        any database. The using parameter will override the default.\n\n        Fields can be used to specify which fields to reload. The fields\n        should be an iterable of field attnames. If fields is None, then\n        all non-deferred fields are reloaded.\n\n        When accessing deferred fields of an instance, the deferred loading\n        of the field will call this method.\n        \"\"\"\n        if fields is not None:\n            if len(fields) == 0:\n                return\n            if any(LOOKUP_SEP in f for f in fields):\n                raise ValueError(\n                    'Found \"%s\" in fields argument. Relations and transforms '\n                    'are not allowed in fields.' % LOOKUP_SEP)\n\n        db = using if using is not None else self._state.db\n        db_instance_qs = self.__class__._default_manager.using(db).filter(pk=self.pk)\n\n        # Use provided fields, if not set then reload all non-deferred fields.\n        deferred_fields = self.get_deferred_fields()\n        if fields is not None:\n            fields = list(fields)\n            db_instance_qs = db_instance_qs.only(*fields)\n        elif deferred_fields:\n            fields = [f.attname for f in self._meta.concrete_fields\n                      if f.attname not in deferred_fields]\n            db_instance_qs = db_instance_qs.only(*fields)\n\n        db_instance = db_instance_qs.get()\n        non_loaded_fields = db_instance.get_deferred_fields()\n        for field in self._meta.concrete_fields:\n            if field.attname in non_loaded_fields:\n                # This field wasn't refreshed - skip ahead.\n                continue\n            setattr(self, field.attname, getattr(db_instance, field.attname))\n            # Throw away stale foreign key references.\n            if field.is_relation and field.is_cached(self):\n                rel_instance = field.get_cached_value(self)\n                local_val = getattr(db_instance, field.attname)\n                related_val = None if rel_instance is None else getattr(rel_instance, field.target_field.attname)\n                if local_val != related_val or (local_val is None and related_val is None):\n                    field.delete_cached_value(self)\n        self._state.db = db_instance._state.db"
        }
      ]
    },
    {
      "pr_number": 13800,
      "pr_title": "Fixed #32191 -- Made CookieStorage use RFC 6265 compliant format.",
      "pr_body": "Continues work by Florian Apolloner in this [PR](https://github.com/django/django/pull/13793).\r\nThe aim is to make messages, when stored in cookies, compliant with RFC6265 which defines allowed characters for cookies. It does this by base64 encoding them, and then to reduce their size, it compresses them using zlib.\r\nThis fix is achieved by introducing `sign_object` and `unsign_object` into the base signer class.",
      "issue_id": 32191,
      "issue_title": "Not RFC 6265 compliant cookies in contrib.messages.",
      "issue_body": "",
      "issue_closed_at": "2021-01-07T06:20:56",
      "base_commit": "3eb98743dcaa0b7abd2d5832cba8cc9cb586a964",
      "changes": [
        {
          "file": "django/contrib/messages/storage/cookie.py",
          "type": "class",
          "name": "MessageEncoder",
          "code": "class MessageEncoder(json.JSONEncoder):\n    \"\"\"\n    Compactly serialize instances of the ``Message`` class as JSON.\n    \"\"\"\n    message_key = '__json_message'\n\n    def __init__(self, *args, **kwargs):\n        kwargs.setdefault('separators', (',', ':'))\n        super().__init__(*args, **kwargs)\n\n    def default(self, obj):\n        if isinstance(obj, Message):\n            # Using 0/1 here instead of False/True to produce more compact json\n            is_safedata = 1 if isinstance(obj.message, SafeData) else 0\n            message = [self.message_key, is_safedata, obj.level, obj.message]\n            if obj.extra_tags:\n                message.append(obj.extra_tags)\n            return message\n        return super().default(obj)"
        },
        {
          "file": "django/contrib/messages/storage/cookie.py",
          "type": "function",
          "name": "decode",
          "class_name": "MessageDecoder",
          "code": "def decode(self, s, **kwargs):\n        decoded = super().decode(s, **kwargs)\n        return self.process_messages(decoded)"
        },
        {
          "file": "django/contrib/messages/storage/cookie.py",
          "type": "function",
          "name": "_encode",
          "class_name": "CookieStorage",
          "code": "def _encode(self, messages, encode_empty=False):\n        \"\"\"\n        Return an encoded version of the messages list which can be stored as\n        plain text.\n\n        Since the data will be retrieved from the client-side, the encoded data\n        also contains a hash to ensure that the data was not tampered with.\n        \"\"\"\n        if messages or encode_empty:\n            encoder = MessageEncoder()\n            value = encoder.encode(messages)\n            return self.signer.sign(value)"
        },
        {
          "file": "django/contrib/messages/storage/cookie.py",
          "type": "function",
          "name": "_decode",
          "class_name": "CookieStorage",
          "code": "def _decode(self, data):\n        \"\"\"\n        Safely decode an encoded text stream back into a list of messages.\n\n        If the encoded text stream contained an invalid hash or was in an\n        invalid format, return None.\n        \"\"\"\n        if not data:\n            return None\n        try:\n            decoded = self.signer.unsign(data)\n        except signing.BadSignature:\n            # RemovedInDjango40Warning: when the deprecation ends, replace\n            # with:\n            #   decoded = None.\n            decoded = self._legacy_decode(data)\n        if decoded:\n            try:\n                return json.loads(decoded, cls=MessageDecoder)\n            except json.JSONDecodeError:\n                pass\n        # Mark the data as used (so it gets removed) since something was wrong\n        # with the data.\n        self.used = True\n        return None"
        }
      ]
    },
    {
      "pr_number": 9512,
      "pr_title": "Fixed #28918 -- Fixed Model.refresh_from_db() for instances hidden by the default manager.",
      "pr_body": "https://code.djangoproject.com/ticket/28918",
      "issue_id": 28918,
      "issue_title": "Model.refresh_from_db() should use _base_manager instead of the default_manager",
      "issue_body": "",
      "issue_closed_at": "2017-12-30T17:01:08",
      "base_commit": "dcdd219ee1e062dc6189f382e0298e0adf5d5ddf",
      "changes": [
        {
          "file": "django/db/models/base.py",
          "type": "function",
          "name": "refresh_from_db",
          "class_name": "Model",
          "code": "def refresh_from_db(self, using=None, fields=None):\n        \"\"\"\n        Reload field values from the database.\n\n        By default, the reloading happens from the database this instance was\n        loaded from, or by the read router if this instance wasn't loaded from\n        any database. The using parameter will override the default.\n\n        Fields can be used to specify which fields to reload. The fields\n        should be an iterable of field attnames. If fields is None, then\n        all non-deferred fields are reloaded.\n\n        When accessing deferred fields of an instance, the deferred loading\n        of the field will call this method.\n        \"\"\"\n        if fields is not None:\n            if not fields:\n                return\n            if any(LOOKUP_SEP in f for f in fields):\n                raise ValueError(\n                    'Found \"%s\" in fields argument. Relations and transforms '\n                    'are not allowed in fields.' % LOOKUP_SEP)\n\n        db = using if using is not None else self._state.db\n        db_instance_qs = self.__class__._default_manager.using(db).filter(pk=self.pk)\n\n        # Use provided fields, if not set then reload all non-deferred fields.\n        deferred_fields = self.get_deferred_fields()\n        if fields is not None:\n            fields = list(fields)\n            db_instance_qs = db_instance_qs.only(*fields)\n        elif deferred_fields:\n            fields = [f.attname for f in self._meta.concrete_fields\n                      if f.attname not in deferred_fields]\n            db_instance_qs = db_instance_qs.only(*fields)\n\n        db_instance = db_instance_qs.get()\n        non_loaded_fields = db_instance.get_deferred_fields()\n        for field in self._meta.concrete_fields:\n            if field.attname in non_loaded_fields:\n                # This field wasn't refreshed - skip ahead.\n                continue\n            setattr(self, field.attname, getattr(db_instance, field.attname))\n            # Throw away stale foreign key references.\n            if field.is_relation and field.is_cached(self):\n                rel_instance = field.get_cached_value(self)\n                local_val = getattr(db_instance, field.attname)\n                related_val = None if rel_instance is None else getattr(rel_instance, field.target_field.attname)\n                if local_val != related_val or (local_val is None and related_val is None):\n                    field.delete_cached_value(self)\n\n        # Clear cached relations.\n        for field in self._meta.related_objects:\n            if field.is_cached(self):\n                field.delete_cached_value(self)\n\n        self._state.db = db_instance._state.db"
        }
      ]
    }
  ]
}