{
  "instance_id": "django__django-11905",
  "repo": "django/django",
  "created_at": "2019-10-11T18:19:39Z",
  "problem_statement": "Prevent using __isnull lookup with non-boolean value.\nDescription\n\t \n\t\t(last modified by Mariusz Felisiak)\n\t \n__isnull should not allow for non-boolean values. Using truthy/falsey doesn't promote INNER JOIN to an OUTER JOIN but works fine for a simple queries. Using non-boolean values is \u200bundocumented and untested. IMO we should raise an error for non-boolean values to avoid confusion and for consistency.\n",
  "patch": "diff --git a/django/db/models/lookups.py b/django/db/models/lookups.py\n--- a/django/db/models/lookups.py\n+++ b/django/db/models/lookups.py\n@@ -1,5 +1,6 @@\n import itertools\n import math\n+import warnings\n from copy import copy\n \n from django.core.exceptions import EmptyResultSet\n@@ -9,6 +10,7 @@\n )\n from django.db.models.query_utils import RegisterLookupMixin\n from django.utils.datastructures import OrderedSet\n+from django.utils.deprecation import RemovedInDjango40Warning\n from django.utils.functional import cached_property\n \n \n@@ -463,6 +465,17 @@ class IsNull(BuiltinLookup):\n     prepare_rhs = False\n \n     def as_sql(self, compiler, connection):\n+        if not isinstance(self.rhs, bool):\n+            # When the deprecation ends, replace with:\n+            # raise ValueError(\n+            #     'The QuerySet value for an isnull lookup must be True or '\n+            #     'False.'\n+            # )\n+            warnings.warn(\n+                'Using a non-boolean value for an isnull lookup is '\n+                'deprecated, use True or False instead.',\n+                RemovedInDjango40Warning,\n+            )\n         sql, params = compiler.compile(self.lhs)\n         if self.rhs:\n             return \"%s IS NULL\" % sql, params\n",
  "similar_bug_items": [
    {
      "pr_number": 8754,
      "pr_title": "Fixed #28391 -- Fixed Cast() with CharField and max_length on MySQL.",
      "pr_body": "https://code.djangoproject.com/ticket/28391",
      "issue_id": 28391,
      "issue_title": "Cast doesn't take into account CharField's max_length on MySQL.",
      "issue_body": "",
      "issue_closed_at": "2017-07-17T14:12:39",
      "base_commit": "feeafdad02e2874e2e2f879a825d3527f6b193ad",
      "changes": [
        {
          "file": "django/db/backends/sqlite3/features.py",
          "type": "class",
          "name": "DatabaseFeatures",
          "code": "class DatabaseFeatures(BaseDatabaseFeatures):\n    # SQLite cannot handle us only partially reading from a cursor's result set\n    # and then writing the same rows to the database in another cursor. This\n    # setting ensures we always read result sets fully into memory all in one\n    # go.\n    can_use_chunked_reads = False\n    test_db_allows_multiple_connections = False\n    supports_unspecified_pk = True\n    supports_timezones = False\n    max_query_params = 999\n    supports_mixed_date_datetime_comparisons = False\n    has_bulk_insert = True\n    supports_column_check_constraints = False\n    autocommits_when_autocommit_is_off = True\n    can_introspect_decimal_field = False\n    can_introspect_positive_integer_field = True\n    can_introspect_small_integer_field = True\n    supports_transactions = True\n    atomic_transactions = False\n    can_rollback_ddl = True\n    supports_paramstyle_pyformat = False\n    supports_sequence_reset = False\n    can_clone_databases = True\n    supports_temporal_subtraction = True\n    ignores_table_name_case = True\n\n    @cached_property\n    def uses_savepoints(self):\n        return Database.sqlite_version_info >= (3, 6, 8)\n\n    @cached_property\n    def supports_index_column_ordering(self):\n        return Database.sqlite_version_info >= (3, 3, 0)\n\n    @cached_property\n    def can_release_savepoints(self):\n        return self.uses_savepoints\n\n    @cached_property\n    def can_share_in_memory_db(self):\n        return (\n            Database.__name__ == 'sqlite3.dbapi2' and\n            Database.sqlite_version_info >= (3, 7, 13)\n        )\n\n    @cached_property\n    def supports_stddev(self):\n        \"\"\"\n        Confirm support for STDDEV and related stats functions.\n\n        SQLite supports STDDEV as an extension package; so\n        connection.ops.check_expression_support() can't unilaterally\n        rule out support for STDDEV. Manually check whether the call works.\n        \"\"\"\n        with self.connection.cursor() as cursor:\n            cursor.execute('CREATE TABLE STDDEV_TEST (X INT)')\n            try:\n                cursor.execute('SELECT STDDEV(*) FROM STDDEV_TEST')\n                has_support = True\n            except utils.DatabaseError:\n                has_support = False\n            cursor.execute('DROP TABLE STDDEV_TEST')\n        return has_support"
        },
        {
          "file": "django/db/models/fields/__init__.py",
          "type": "function",
          "name": "clean",
          "class_name": "Field",
          "code": "def clean(self, value, model_instance):\n        \"\"\"\n        Convert the value's type and run validation. Validation errors\n        from to_python() and validate() are propagated. Return the correct\n        value if no error is raised.\n        \"\"\"\n        value = self.to_python(value)\n        self.validate(value, model_instance)\n        self.run_validators(value)\n        return value"
        },
        {
          "file": "django/db/models/fields/__init__.py",
          "type": "function",
          "name": "db_type",
          "class_name": "Field",
          "code": "def db_type(self, connection):\n        \"\"\"\n        Return the database column data type for this field, for the provided\n        connection.\n        \"\"\"\n        # The default implementation of this method looks at the\n        # backend-specific data_types dictionary, looking up the field by its\n        # \"internal type\".\n        #\n        # A Field class can implement the get_internal_type() method to specify\n        # which *preexisting* Django Field class it's most similar to -- i.e.,\n        # a custom field might be represented by a TEXT column type, which is\n        # the same as the TextField Django field type, which means the custom\n        # field's get_internal_type() returns 'TextField'.\n        #\n        # But the limitation of the get_internal_type() / data_types approach\n        # is that it cannot handle database column types that aren't already\n        # mapped to one of the built-in Django field types. In this case, you\n        # can implement db_type() instead of get_internal_type() to specify\n        # exactly which wacky database column type you want to use.\n        data = DictWrapper(self.__dict__, connection.ops.quote_name, \"qn_\")\n        try:\n            return connection.data_types[self.get_internal_type()] % data\n        except KeyError:\n            return None"
        },
        {
          "file": "django/db/models/functions/base.py",
          "type": "class",
          "name": "Cast",
          "code": "class Cast(Func):\n    \"\"\"Coerce an expression to a new field type.\"\"\"\n    function = 'CAST'\n    template = '%(function)s(%(expressions)s AS %(db_type)s)'\n\n    mysql_types = {\n        fields.CharField: 'char',\n        fields.IntegerField: 'signed integer',\n        fields.BigIntegerField: 'signed integer',\n        fields.SmallIntegerField: 'signed integer',\n        fields.FloatField: 'signed',\n        fields.PositiveIntegerField: 'unsigned integer',\n        fields.PositiveSmallIntegerField: 'unsigned integer',\n    }\n\n    def __init__(self, expression, output_field):\n        super().__init__(expression, output_field=output_field)\n\n    def as_sql(self, compiler, connection, **extra_context):\n        if 'db_type' not in extra_context:\n            extra_context['db_type'] = self.output_field.db_type(connection)\n        return super().as_sql(compiler, connection, **extra_context)\n\n    def as_mysql(self, compiler, connection):\n        extra_context = {}\n        output_field_class = type(self.output_field)\n        if output_field_class in self.mysql_types:\n            extra_context['db_type'] = self.mysql_types[output_field_class]\n        return self.as_sql(compiler, connection, **extra_context)\n\n    def as_postgresql(self, compiler, connection):\n        # CAST would be valid too, but the :: shortcut syntax is more readable.\n        return self.as_sql(compiler, connection, template='%(expressions)s::%(db_type)s')"
        },
        {
          "file": "django/db/models/functions/base.py",
          "type": "function",
          "name": "as_mysql",
          "class_name": "Length",
          "code": "def as_mysql(self, compiler, connection):\n        return super().as_sql(compiler, connection, function='CHAR_LENGTH')"
        }
      ]
    },
    {
      "pr_number": 6774,
      "pr_title": "Fixed #26171 -- Made MySQL create an index on ForeignKeys with db_contraint=False.",
      "pr_body": "Refactor \"Prevented unneeded index creation on MySQL-InnoDB\" (2ceb10f)\nto avoid setting db_index = False. Check db_constraint=True before\nskipping the index creation, fixes #26171.\n",
      "issue_id": 26171,
      "issue_title": "ForeignKey with db_constraint=False doesn't generate an index on MySQL",
      "issue_body": "",
      "issue_closed_at": "2016-06-28T07:19:11",
      "base_commit": "5fe1c92250017110430c7c2153cfd8776e4c7064",
      "changes": [
        {
          "file": "django/db/backends/base/schema.py",
          "type": "function",
          "name": "_model_indexes_sql",
          "class_name": "BaseDatabaseSchemaEditor",
          "code": "def _model_indexes_sql(self, model):\n        \"\"\"\n        Return all index SQL statements (field indexes, index_together) for the\n        specified model, as a list.\n        \"\"\"\n        if not model._meta.managed or model._meta.proxy or model._meta.swapped:\n            return []\n        output = []\n        for field in model._meta.local_fields:\n            if field.db_index and not field.unique:\n                output.append(self._create_index_sql(model, [field], suffix=\"\"))\n\n        for field_names in model._meta.index_together:\n            fields = [model._meta.get_field(field) for field in field_names]\n            output.append(self._create_index_sql(model, fields, suffix=\"_idx\"))\n        return output"
        },
        {
          "file": "django/db/backends/base/schema.py",
          "type": "function",
          "name": "_model_indexes_sql",
          "class_name": "BaseDatabaseSchemaEditor",
          "code": "def _model_indexes_sql(self, model):\n        \"\"\"\n        Return all index SQL statements (field indexes, index_together) for the\n        specified model, as a list.\n        \"\"\"\n        if not model._meta.managed or model._meta.proxy or model._meta.swapped:\n            return []\n        output = []\n        for field in model._meta.local_fields:\n            if field.db_index and not field.unique:\n                output.append(self._create_index_sql(model, [field], suffix=\"\"))\n\n        for field_names in model._meta.index_together:\n            fields = [model._meta.get_field(field) for field in field_names]\n            output.append(self._create_index_sql(model, fields, suffix=\"_idx\"))\n        return output"
        },
        {
          "file": "django/db/backends/mysql/schema.py",
          "type": "function",
          "name": "add_field",
          "class_name": "DatabaseSchemaEditor",
          "code": "def add_field(self, model, field):\n        super(DatabaseSchemaEditor, self).add_field(model, field)\n\n        # Simulate the effect of a one-off default.\n        # field.default may be unhashable, so a set isn't used for \"in\" check.\n        if self.skip_default(field) and field.default not in (None, NOT_PROVIDED):\n            effective_default = self.effective_default(field)\n            self.execute('UPDATE %(table)s SET %(column)s = %%s' % {\n                'table': self.quote_name(model._meta.db_table),\n                'column': self.quote_name(field.column),\n            }, [effective_default])"
        }
      ]
    },
    {
      "pr_number": 9964,
      "pr_title": "Fixed #29413 -- Prevented evaluation of QuerySet.get_or_create()/update_or_create() defaults unless needed.",
      "pr_body": "https://code.djangoproject.com/ticket/29413",
      "issue_id": 29413,
      "issue_title": "QuerySet.get_or_create()/update_or_create() shouldn't evaluate lazy defaults unless they are needed",
      "issue_body": "",
      "issue_closed_at": "2018-07-16T21:09:12",
      "base_commit": "4d48ddd8f93800a80330ec1dee7b7d4afe6ea95a",
      "changes": [
        {
          "file": "django/db/models/query.py",
          "type": "function",
          "name": "get_or_create",
          "class_name": "QuerySet",
          "code": "def get_or_create(self, defaults=None, **kwargs):\n        \"\"\"\n        Look up an object with the given kwargs, creating one if necessary.\n        Return a tuple of (object, created), where created is a boolean\n        specifying whether an object was created.\n        \"\"\"\n        lookup, params = self._extract_model_params(defaults, **kwargs)\n        # The get() needs to be targeted at the write database in order\n        # to avoid potential transaction consistency problems.\n        self._for_write = True\n        try:\n            return self.get(**lookup), False\n        except self.model.DoesNotExist:\n            return self._create_object_from_params(lookup, params)"
        },
        {
          "file": "django/db/models/query.py",
          "type": "function",
          "name": "update_or_create",
          "class_name": "QuerySet",
          "code": "def update_or_create(self, defaults=None, **kwargs):\n        \"\"\"\n        Look up an object with the given kwargs, updating one with defaults\n        if it exists, otherwise create a new one.\n        Return a tuple (object, created), where created is a boolean\n        specifying whether an object was created.\n        \"\"\"\n        defaults = defaults or {}\n        lookup, params = self._extract_model_params(defaults, **kwargs)\n        self._for_write = True\n        with transaction.atomic(using=self.db):\n            try:\n                obj = self.select_for_update().get(**lookup)\n            except self.model.DoesNotExist:\n                obj, created = self._create_object_from_params(lookup, params)\n                if created:\n                    return obj, created\n            for k, v in defaults.items():\n                setattr(obj, k, v() if callable(v) else v)\n            obj.save(using=self.db)\n        return obj, False"
        },
        {
          "file": "django/db/models/query.py",
          "type": "function",
          "name": "_create_object_from_params",
          "class_name": "QuerySet",
          "code": "def _create_object_from_params(self, lookup, params):\n        \"\"\"\n        Try to create an object using passed params. Used by get_or_create()\n        and update_or_create().\n        \"\"\"\n        try:\n            with transaction.atomic(using=self.db):\n                params = {k: v() if callable(v) else v for k, v in params.items()}\n                obj = self.create(**params)\n            return obj, True\n        except IntegrityError as e:\n            try:\n                return self.get(**lookup), False\n            except self.model.DoesNotExist:\n                pass\n            raise e"
        },
        {
          "file": "django/db/models/query.py",
          "type": "function",
          "name": "_extract_model_params",
          "class_name": "QuerySet",
          "code": "def _extract_model_params(self, defaults, **kwargs):\n        \"\"\"\n        Prepare `lookup` (kwargs that are valid model attributes), `params`\n        (for creating a model instance) based on given kwargs; for use by\n        get_or_create() and update_or_create().\n        \"\"\"\n        defaults = defaults or {}\n        lookup = kwargs.copy()\n        for f in self.model._meta.fields:\n            if f.attname in lookup:\n                lookup[f.name] = lookup.pop(f.attname)\n        params = {k: v for k, v in kwargs.items() if LOOKUP_SEP not in k}\n        params.update(defaults)\n        property_names = self.model._meta._property_names\n        invalid_params = []\n        for param in params:\n            try:\n                self.model._meta.get_field(param)\n            except exceptions.FieldDoesNotExist:\n                # It's okay to use a model's property if it has a setter.\n                if not (param in property_names and getattr(self.model, param).fset):\n                    invalid_params.append(param)\n        if invalid_params:\n            raise exceptions.FieldError(\n                \"Invalid field name(s) for model %s: '%s'.\" % (\n                    self.model._meta.object_name,\n                    \"', '\".join(sorted(invalid_params)),\n                ))\n        return lookup, params"
        }
      ]
    },
    {
      "pr_number": 9380,
      "pr_title": "Fixed #28834 -- Followed ancestor links on field cache lookup failure.",
      "pr_body": "https://code.djangoproject.com/ticket/28834",
      "issue_id": 28834,
      "issue_title": "Fields cache should attempt to follow ancestor links on lookup failures",
      "issue_body": "",
      "issue_closed_at": "2017-11-29T00:30:02",
      "base_commit": "746caf3ef821dbf7588797cb2600fa81b9df9d1d",
      "changes": [
        {
          "file": "django/db/models/fields/mixins.py",
          "type": "function",
          "name": "get_cached_value",
          "class_name": "FieldCacheMixin",
          "code": "def get_cached_value(self, instance, default=NOT_PROVIDED):\n        cache_name = self.get_cache_name()\n        try:\n            return instance._state.fields_cache[cache_name]\n        except KeyError:\n            if default is NOT_PROVIDED:\n                raise\n            return default"
        }
      ]
    },
    {
      "pr_number": 11263,
      "pr_title": "Fixed #30361 -- Increased the default timeout of watchman client to 5 seconds and made it customizable.",
      "pr_body": "",
      "issue_id": 30361,
      "issue_title": "Watchman timing out when loading server",
      "issue_body": "",
      "issue_closed_at": "2019-04-26T06:35:55",
      "base_commit": "efeceba589974b95b35b2e25df86498c96315518",
      "changes": [
        {
          "file": "django/utils/autoreload.py",
          "type": "class",
          "name": "WatchmanReloader",
          "code": "class WatchmanReloader(BaseReloader):\n    def __init__(self):\n        self.roots = defaultdict(set)\n        self.processed_request = threading.Event()\n        super().__init__()\n\n    @cached_property\n    def client(self):\n        return pywatchman.client()\n\n    def _watch_root(self, root):\n        # In practice this shouldn't occur, however, it's possible that a\n        # directory that doesn't exist yet is being watched. If it's outside of\n        # sys.path then this will end up a new root. How to handle this isn't\n        # clear: Not adding the root will likely break when subscribing to the\n        # changes, however, as this is currently an internal API,  no files\n        # will be being watched outside of sys.path. Fixing this by checking\n        # inside watch_glob() and watch_dir() is expensive, instead this could\n        # could fall back to the StatReloader if this case is detected? For\n        # now, watching its parent, if possible, is sufficient.\n        if not root.exists():\n            if not root.parent.exists():\n                logger.warning('Unable to watch root dir %s as neither it or its parent exist.', root)\n                return\n            root = root.parent\n        result = self.client.query('watch-project', str(root.absolute()))\n        if 'warning' in result:\n            logger.warning('Watchman warning: %s', result['warning'])\n        logger.debug('Watchman watch-project result: %s', result)\n        return result['watch'], result.get('relative_path')\n\n    @functools.lru_cache()\n    def _get_clock(self, root):\n        return self.client.query('clock', root)['clock']\n\n    def _subscribe(self, directory, name, expression):\n        root, rel_path = self._watch_root(directory)\n        query = {\n            'expression': expression,\n            'fields': ['name'],\n            'since': self._get_clock(root),\n            'dedup_results': True,\n        }\n        if rel_path:\n            query['relative_root'] = rel_path\n        logger.debug('Issuing watchman subscription %s, for root %s. Query: %s', name, root, query)\n        self.client.query('subscribe', root, name, query)\n\n    def _subscribe_dir(self, directory, filenames):\n        if not directory.exists():\n            if not directory.parent.exists():\n                logger.warning('Unable to watch directory %s as neither it or its parent exist.', directory)\n                return\n            prefix = 'files-parent-%s' % directory.name\n            filenames = ['%s/%s' % (directory.name, filename) for filename in filenames]\n            directory = directory.parent\n            expression = ['name', filenames, 'wholename']\n        else:\n            prefix = 'files'\n            expression = ['name', filenames]\n        self._subscribe(directory, '%s:%s' % (prefix, directory), expression)\n\n    def _watch_glob(self, directory, patterns):\n        \"\"\"\n        Watch a directory with a specific glob. If the directory doesn't yet\n        exist, attempt to watch the parent directory and amend the patterns to\n        include this. It's important this method isn't called more than one per\n        directory when updating all subscriptions. Subsequent calls will\n        overwrite the named subscription, so it must include all possible glob\n        expressions.\n        \"\"\"\n        prefix = 'glob'\n        if not directory.exists():\n            if not directory.parent.exists():\n                logger.warning('Unable to watch directory %s as neither it or its parent exist.', directory)\n                return\n            prefix = 'glob-parent-%s' % directory.name\n            patterns = ['%s/%s' % (directory.name, pattern) for pattern in patterns]\n            directory = directory.parent\n\n        expression = ['anyof']\n        for pattern in patterns:\n            expression.append(['match', pattern, 'wholename'])\n        self._subscribe(directory, '%s:%s' % (prefix, directory), expression)\n\n    def watched_roots(self, watched_files):\n        extra_directories = self.directory_globs.keys()\n        watched_file_dirs = [f.parent for f in watched_files]\n        sys_paths = list(sys_path_directories())\n        return frozenset((*extra_directories, *watched_file_dirs, *sys_paths))\n\n    def _update_watches(self):\n        watched_files = list(self.watched_files(include_globs=False))\n        found_roots = common_roots(self.watched_roots(watched_files))\n        logger.debug('Watching %s files', len(watched_files))\n        logger.debug('Found common roots: %s', found_roots)\n        # Setup initial roots for performance, shortest roots first.\n        for root in sorted(found_roots):\n            self._watch_root(root)\n        for directory, patterns in self.directory_globs.items():\n            self._watch_glob(directory, patterns)\n        # Group sorted watched_files by their parent directory.\n        sorted_files = sorted(watched_files, key=lambda p: p.parent)\n        for directory, group in itertools.groupby(sorted_files, key=lambda p: p.parent):\n            # These paths need to be relative to the parent directory.\n            self._subscribe_dir(directory, [str(p.relative_to(directory)) for p in group])\n\n    def update_watches(self):\n        try:\n            self._update_watches()\n        except Exception as ex:\n            # If the service is still available, raise the original exception.\n            if self.check_server_status(ex):\n                raise\n\n    def _check_subscription(self, sub):\n        subscription = self.client.getSubscription(sub)\n        if not subscription:\n            return\n        logger.debug('Watchman subscription %s has results.', sub)\n        for result in subscription:\n            # When using watch-project, it's not simple to get the relative\n            # directory without storing some specific state. Store the full\n            # path to the directory in the subscription name, prefixed by its\n            # type (glob, files).\n            root_directory = Path(result['subscription'].split(':', 1)[1])\n            logger.debug('Found root directory %s', root_directory)\n            for file in result.get('files', []):\n                self.notify_file_changed(root_directory / file)\n\n    def request_processed(self, **kwargs):\n        logger.debug('Request processed. Setting update_watches event.')\n        self.processed_request.set()\n\n    def tick(self):\n        request_finished.connect(self.request_processed)\n        self.update_watches()\n        while True:\n            if self.processed_request.is_set():\n                self.update_watches()\n                self.processed_request.clear()\n            try:\n                self.client.receive()\n            except pywatchman.WatchmanError as ex:\n                self.check_server_status(ex)\n            else:\n                for sub in list(self.client.subs.keys()):\n                    self._check_subscription(sub)\n            yield\n\n    def stop(self):\n        self.client.close()\n        super().stop()\n\n    def check_server_status(self, inner_ex=None):\n        \"\"\"Return True if the server is available.\"\"\"\n        try:\n            self.client.query('version')\n        except Exception:\n            raise WatchmanUnavailable(str(inner_ex)) from inner_ex\n        return True\n\n    @classmethod\n    def check_availability(cls):\n        if not pywatchman:\n            raise WatchmanUnavailable('pywatchman not installed.')\n        client = pywatchman.client(timeout=0.01)\n        try:\n            result = client.capabilityCheck()\n        except Exception:\n            # The service is down?\n            raise WatchmanUnavailable('Cannot connect to the watchman service.')\n        version = get_version_tuple(result['version'])\n        # Watchman 4.9 includes multiple improvements to watching project\n        # directories as well as case insensitive filesystems.\n        logger.debug('Watchman version %s', version)\n        if version < (4, 9):\n            raise WatchmanUnavailable('Watchman 4.9 or later is required.')"
        },
        {
          "file": "django/utils/autoreload.py",
          "type": "function",
          "name": "check_server_status",
          "class_name": "WatchmanReloader",
          "code": "def check_server_status(self, inner_ex=None):\n        \"\"\"Return True if the server is available.\"\"\"\n        try:\n            self.client.query('version')\n        except Exception:\n            raise WatchmanUnavailable(str(inner_ex)) from inner_ex\n        return True"
        }
      ]
    }
  ]
}