{
  "instance_id": "django__django-13964",
  "repo": "django/django",
  "created_at": "2021-02-02T17:07:43Z",
  "problem_statement": "Saving parent object after setting on child leads to data loss for parents with non-numeric primary key.\nDescription\n\t \n\t\t(last modified by Charlie DeTar)\n\t \nGiven a model with a foreign key relation to another model that has a non-auto CharField as its primary key:\nclass Product(models.Model):\n\tsku = models.CharField(primary_key=True, max_length=50)\nclass Order(models.Model):\n\tproduct = models.ForeignKey(Product, on_delete=models.CASCADE)\nIf the relation is initialized on the parent with an empty instance that does not yet specify its primary key, and the primary key is subsequently defined, the parent does not \"see\" the primary key's change:\nwith transaction.atomic():\n\torder = Order()\n\torder.product = Product()\n\torder.product.sku = \"foo\"\n\torder.product.save()\n\torder.save()\n\tassert Order.objects.filter(product_id=\"\").exists() # Succeeds, but shouldn't\n\tassert Order.objects.filter(product=order.product).exists() # Fails\nInstead of product_id being populated with product.sku, it is set to emptystring. The foreign key constraint which would enforce the existence of a product with sku=\"\" is deferred until the transaction commits. The transaction does correctly fail on commit with a ForeignKeyViolation due to the non-existence of a product with emptystring as its primary key.\nOn the other hand, if the related unsaved instance is initialized with its primary key before assignment to the parent, it is persisted correctly:\nwith transaction.atomic():\n\torder = Order()\n\torder.product = Product(sku=\"foo\")\n\torder.product.save()\n\torder.save()\n\tassert Order.objects.filter(product=order.product).exists() # succeeds\nCommitting the transaction also succeeds.\nThis may have something to do with how the Order.product_id field is handled at assignment, together with something about handling fetching of auto vs non-auto primary keys from the related instance.\n",
  "patch": "diff --git a/django/db/models/base.py b/django/db/models/base.py\n--- a/django/db/models/base.py\n+++ b/django/db/models/base.py\n@@ -933,7 +933,7 @@ def _prepare_related_fields_for_save(self, operation_name):\n                         \"%s() prohibited to prevent data loss due to unsaved \"\n                         \"related object '%s'.\" % (operation_name, field.name)\n                     )\n-                elif getattr(self, field.attname) is None:\n+                elif getattr(self, field.attname) in field.empty_values:\n                     # Use pk from related object if it has been saved after\n                     # an assignment.\n                     setattr(self, field.attname, obj.pk)\n",
  "similar_bug_items": [
    {
      "pr_number": 7097,
      "pr_title": "Fixed #27068 -- Unified form field initial data retrieval.",
      "pr_body": "https://code.djangoproject.com/ticket/27068\n",
      "issue_id": 27068,
      "issue_title": "Acquire form's initial data more consistently",
      "issue_body": "",
      "issue_closed_at": "2016-08-18T19:51:32",
      "base_commit": "13857b45ca54a519a58361238442af84262c0d23",
      "changes": [
        {
          "file": "django/forms/boundfield.py",
          "type": "function",
          "name": "value",
          "class_name": "BoundField",
          "code": "def value(self):\n        \"\"\"\n        Returns the value for this BoundField, using the initial value if\n        the form is not bound or the data otherwise.\n        \"\"\"\n        if not self.form.is_bound:\n            data = self.initial\n        else:\n            data = self.field.bound_data(\n                self.data, self.form.initial.get(self.name, self.field.initial)\n            )\n        return self.field.prepare_value(data)"
        },
        {
          "file": "django/forms/boundfield.py",
          "type": "function",
          "name": "id_for_label",
          "class_name": "BoundField",
          "code": "def id_for_label(self):\n        \"\"\"\n        Wrapper around the field widget's `id_for_label` method.\n        Useful, for example, for focusing on this field regardless of whether\n        it has a single widget or a MultiWidget.\n        \"\"\"\n        widget = self.field.widget\n        id_ = widget.attrs.get('id') or self.auto_id\n        return widget.id_for_label(id_)"
        },
        {
          "file": "django/forms/forms.py",
          "type": "function",
          "name": "_clean_fields",
          "class_name": "BaseForm",
          "code": "def _clean_fields(self):\n        for name, field in self.fields.items():\n            # value_from_datadict() gets the data from the data dictionaries.\n            # Each widget type knows how to retrieve its own data, because some\n            # widgets split data over several HTML fields.\n            if field.disabled:\n                value = self.initial.get(name, field.initial)\n            else:\n                value = field.widget.value_from_datadict(self.data, self.files, self.add_prefix(name))\n            try:\n                if isinstance(field, FileField):\n                    initial = self.initial.get(name, field.initial)\n                    value = field.clean(value, initial)\n                else:\n                    value = field.clean(value)\n                self.cleaned_data[name] = value\n                if hasattr(self, 'clean_%s' % name):\n                    value = getattr(self, 'clean_%s' % name)()\n                    self.cleaned_data[name] = value\n            except ValidationError as e:\n                self.add_error(name, e)"
        },
        {
          "file": "django/forms/forms.py",
          "type": "function",
          "name": "changed_data",
          "class_name": "BaseForm",
          "code": "def changed_data(self):\n        data = []\n        for name, field in self.fields.items():\n            prefixed_name = self.add_prefix(name)\n            data_value = field.widget.value_from_datadict(self.data, self.files, prefixed_name)\n            if not field.show_hidden_initial:\n                initial_value = self.initial.get(name, field.initial)\n                if callable(initial_value):\n                    initial_value = initial_value()\n            else:\n                initial_prefixed_name = self.add_initial_prefix(name)\n                hidden_widget = field.hidden_widget()\n                try:\n                    initial_value = field.to_python(hidden_widget.value_from_datadict(\n                        self.data, self.files, initial_prefixed_name))\n                except ValidationError:\n                    # Always assume data has changed if validation fails.\n                    data.append(name)\n                    continue\n            if field.has_changed(initial_value, data_value):\n                data.append(name)\n        return data"
        },
        {
          "file": "django/forms/forms.py",
          "type": "function",
          "name": "visible_fields",
          "class_name": "BaseForm",
          "code": "def visible_fields(self):\n        \"\"\"\n        Returns a list of BoundField objects that aren't hidden fields.\n        The opposite of the hidden_fields() method.\n        \"\"\"\n        return [field for field in self if not field.is_hidden]"
        }
      ]
    },
    {
      "pr_number": 11005,
      "pr_title": "Fixed #30183 -- Added parsing of inline SQLite constraints.",
      "pr_body": "",
      "issue_id": 30183,
      "issue_title": "SQLite instrospection.get_constraints() for unique constraints return wrong count of constraints and doesn't have columns for all items",
      "issue_body": "",
      "issue_closed_at": "2019-03-13T11:19:22",
      "base_commit": "406de977ea1a6429535d21240e3ecdac06d4516c",
      "changes": [
        {
          "file": "django/db/backends/sqlite3/introspection.py",
          "type": "function",
          "name": "_get_foreign_key_constraints",
          "class_name": "DatabaseIntrospection",
          "code": "def _get_foreign_key_constraints(self, cursor, table_name):\n        constraints = {}\n        cursor.execute('PRAGMA foreign_key_list(%s)' % self.connection.ops.quote_name(table_name))\n        for row in cursor.fetchall():\n            # Remaining on_update/on_delete/match values are of no interest.\n            id_, _, table, from_, to = row[:5]\n            constraints['fk_%d' % id_] = {\n                'columns': [from_],\n                'primary_key': False,\n                'unique': False,\n                'foreign_key': (table, to),\n                'check': False,\n                'index': False,\n            }\n        return constraints"
        },
        {
          "file": "django/db/backends/sqlite3/introspection.py",
          "type": "function",
          "name": "get_constraints",
          "class_name": "DatabaseIntrospection",
          "code": "def get_constraints(self, cursor, table_name):\n        \"\"\"\n        Retrieve any constraints or keys (unique, pk, fk, check, index) across\n        one or more columns.\n        \"\"\"\n        constraints = {}\n        # Find inline check constraints.\n        try:\n            table_schema = cursor.execute(\n                \"SELECT sql FROM sqlite_master WHERE type='table' and name=%s\" % (\n                    self.connection.ops.quote_name(table_name),\n                )\n            ).fetchone()[0]\n        except TypeError:\n            # table_name is a view.\n            pass\n        else:\n            constraints.update(self._parse_table_constraints(table_schema))\n\n        # Get the index info\n        cursor.execute(\"PRAGMA index_list(%s)\" % self.connection.ops.quote_name(table_name))\n        for row in cursor.fetchall():\n            # SQLite 3.8.9+ has 5 columns, however older versions only give 3\n            # columns. Discard last 2 columns if there.\n            number, index, unique = row[:3]\n            # Get the index info for that index\n            cursor.execute('PRAGMA index_info(%s)' % self.connection.ops.quote_name(index))\n            for index_rank, column_rank, column in cursor.fetchall():\n                if index not in constraints:\n                    constraints[index] = {\n                        \"columns\": [],\n                        \"primary_key\": False,\n                        \"unique\": bool(unique),\n                        \"foreign_key\": None,\n                        \"check\": False,\n                        \"index\": True,\n                    }\n                constraints[index]['columns'].append(column)\n            # Add type and column orders for indexes\n            if constraints[index]['index'] and not constraints[index]['unique']:\n                # SQLite doesn't support any index type other than b-tree\n                constraints[index]['type'] = Index.suffix\n                cursor.execute(\n                    \"SELECT sql FROM sqlite_master \"\n                    \"WHERE type='index' AND name=%s\" % self.connection.ops.quote_name(index)\n                )\n                orders = []\n                # There would be only 1 row to loop over\n                for sql, in cursor.fetchall():\n                    order_info = sql.split('(')[-1].split(')')[0].split(',')\n                    orders = ['DESC' if info.endswith('DESC') else 'ASC' for info in order_info]\n                constraints[index]['orders'] = orders\n        # Get the PK\n        pk_column = self.get_primary_key_column(cursor, table_name)\n        if pk_column:\n            # SQLite doesn't actually give a name to the PK constraint,\n            # so we invent one. This is fine, as the SQLite backend never\n            # deletes PK constraints by name, as you can't delete constraints\n            # in SQLite; we remake the table with a new PK instead.\n            constraints[\"__primary__\"] = {\n                \"columns\": [pk_column],\n                \"primary_key\": True,\n                \"unique\": False,  # It's not actually a unique constraint.\n                \"foreign_key\": None,\n                \"check\": False,\n                \"index\": False,\n            }\n        constraints.update(self._get_foreign_key_constraints(cursor, table_name))\n        return constraints"
        },
        {
          "file": "django/db/backends/sqlite3/introspection.py",
          "type": "function",
          "name": "get_constraints",
          "class_name": "DatabaseIntrospection",
          "code": "def get_constraints(self, cursor, table_name):\n        \"\"\"\n        Retrieve any constraints or keys (unique, pk, fk, check, index) across\n        one or more columns.\n        \"\"\"\n        constraints = {}\n        # Find inline check constraints.\n        try:\n            table_schema = cursor.execute(\n                \"SELECT sql FROM sqlite_master WHERE type='table' and name=%s\" % (\n                    self.connection.ops.quote_name(table_name),\n                )\n            ).fetchone()[0]\n        except TypeError:\n            # table_name is a view.\n            pass\n        else:\n            constraints.update(self._parse_table_constraints(table_schema))\n\n        # Get the index info\n        cursor.execute(\"PRAGMA index_list(%s)\" % self.connection.ops.quote_name(table_name))\n        for row in cursor.fetchall():\n            # SQLite 3.8.9+ has 5 columns, however older versions only give 3\n            # columns. Discard last 2 columns if there.\n            number, index, unique = row[:3]\n            # Get the index info for that index\n            cursor.execute('PRAGMA index_info(%s)' % self.connection.ops.quote_name(index))\n            for index_rank, column_rank, column in cursor.fetchall():\n                if index not in constraints:\n                    constraints[index] = {\n                        \"columns\": [],\n                        \"primary_key\": False,\n                        \"unique\": bool(unique),\n                        \"foreign_key\": None,\n                        \"check\": False,\n                        \"index\": True,\n                    }\n                constraints[index]['columns'].append(column)\n            # Add type and column orders for indexes\n            if constraints[index]['index'] and not constraints[index]['unique']:\n                # SQLite doesn't support any index type other than b-tree\n                constraints[index]['type'] = Index.suffix\n                cursor.execute(\n                    \"SELECT sql FROM sqlite_master \"\n                    \"WHERE type='index' AND name=%s\" % self.connection.ops.quote_name(index)\n                )\n                orders = []\n                # There would be only 1 row to loop over\n                for sql, in cursor.fetchall():\n                    order_info = sql.split('(')[-1].split(')')[0].split(',')\n                    orders = ['DESC' if info.endswith('DESC') else 'ASC' for info in order_info]\n                constraints[index]['orders'] = orders\n        # Get the PK\n        pk_column = self.get_primary_key_column(cursor, table_name)\n        if pk_column:\n            # SQLite doesn't actually give a name to the PK constraint,\n            # so we invent one. This is fine, as the SQLite backend never\n            # deletes PK constraints by name, as you can't delete constraints\n            # in SQLite; we remake the table with a new PK instead.\n            constraints[\"__primary__\"] = {\n                \"columns\": [pk_column],\n                \"primary_key\": True,\n                \"unique\": False,  # It's not actually a unique constraint.\n                \"foreign_key\": None,\n                \"check\": False,\n                \"index\": False,\n            }\n        constraints.update(self._get_foreign_key_constraints(cursor, table_name))\n        return constraints"
        },
        {
          "file": "django/db/backends/sqlite3/introspection.py",
          "type": "function",
          "name": "get_constraints",
          "class_name": "DatabaseIntrospection",
          "code": "def get_constraints(self, cursor, table_name):\n        \"\"\"\n        Retrieve any constraints or keys (unique, pk, fk, check, index) across\n        one or more columns.\n        \"\"\"\n        constraints = {}\n        # Find inline check constraints.\n        try:\n            table_schema = cursor.execute(\n                \"SELECT sql FROM sqlite_master WHERE type='table' and name=%s\" % (\n                    self.connection.ops.quote_name(table_name),\n                )\n            ).fetchone()[0]\n        except TypeError:\n            # table_name is a view.\n            pass\n        else:\n            constraints.update(self._parse_table_constraints(table_schema))\n\n        # Get the index info\n        cursor.execute(\"PRAGMA index_list(%s)\" % self.connection.ops.quote_name(table_name))\n        for row in cursor.fetchall():\n            # SQLite 3.8.9+ has 5 columns, however older versions only give 3\n            # columns. Discard last 2 columns if there.\n            number, index, unique = row[:3]\n            # Get the index info for that index\n            cursor.execute('PRAGMA index_info(%s)' % self.connection.ops.quote_name(index))\n            for index_rank, column_rank, column in cursor.fetchall():\n                if index not in constraints:\n                    constraints[index] = {\n                        \"columns\": [],\n                        \"primary_key\": False,\n                        \"unique\": bool(unique),\n                        \"foreign_key\": None,\n                        \"check\": False,\n                        \"index\": True,\n                    }\n                constraints[index]['columns'].append(column)\n            # Add type and column orders for indexes\n            if constraints[index]['index'] and not constraints[index]['unique']:\n                # SQLite doesn't support any index type other than b-tree\n                constraints[index]['type'] = Index.suffix\n                cursor.execute(\n                    \"SELECT sql FROM sqlite_master \"\n                    \"WHERE type='index' AND name=%s\" % self.connection.ops.quote_name(index)\n                )\n                orders = []\n                # There would be only 1 row to loop over\n                for sql, in cursor.fetchall():\n                    order_info = sql.split('(')[-1].split(')')[0].split(',')\n                    orders = ['DESC' if info.endswith('DESC') else 'ASC' for info in order_info]\n                constraints[index]['orders'] = orders\n        # Get the PK\n        pk_column = self.get_primary_key_column(cursor, table_name)\n        if pk_column:\n            # SQLite doesn't actually give a name to the PK constraint,\n            # so we invent one. This is fine, as the SQLite backend never\n            # deletes PK constraints by name, as you can't delete constraints\n            # in SQLite; we remake the table with a new PK instead.\n            constraints[\"__primary__\"] = {\n                \"columns\": [pk_column],\n                \"primary_key\": True,\n                \"unique\": False,  # It's not actually a unique constraint.\n                \"foreign_key\": None,\n                \"check\": False,\n                \"index\": False,\n            }\n        constraints.update(self._get_foreign_key_constraints(cursor, table_name))\n        return constraints"
        }
      ]
    },
    {
      "pr_number": 9112,
      "pr_title": "Fixed #27846 -- clear all cached reverse relationships on refresh_from_db()",
      "pr_body": "https://code.djangoproject.com/ticket/27846",
      "issue_id": 27846,
      "issue_title": "refresh_from_db() doesn't clear reverse OneToOneFields",
      "issue_body": "",
      "issue_closed_at": "2017-10-12T16:25:22",
      "base_commit": "df0aebc893973c78d7d2cda712ba4133dbe29b6e",
      "changes": [
        {
          "file": "django/db/models/base.py",
          "type": "function",
          "name": "refresh_from_db",
          "class_name": "Model",
          "code": "def refresh_from_db(self, using=None, fields=None):\n        \"\"\"\n        Reload field values from the database.\n\n        By default, the reloading happens from the database this instance was\n        loaded from, or by the read router if this instance wasn't loaded from\n        any database. The using parameter will override the default.\n\n        Fields can be used to specify which fields to reload. The fields\n        should be an iterable of field attnames. If fields is None, then\n        all non-deferred fields are reloaded.\n\n        When accessing deferred fields of an instance, the deferred loading\n        of the field will call this method.\n        \"\"\"\n        if fields is not None:\n            if len(fields) == 0:\n                return\n            if any(LOOKUP_SEP in f for f in fields):\n                raise ValueError(\n                    'Found \"%s\" in fields argument. Relations and transforms '\n                    'are not allowed in fields.' % LOOKUP_SEP)\n\n        db = using if using is not None else self._state.db\n        db_instance_qs = self.__class__._default_manager.using(db).filter(pk=self.pk)\n\n        # Use provided fields, if not set then reload all non-deferred fields.\n        deferred_fields = self.get_deferred_fields()\n        if fields is not None:\n            fields = list(fields)\n            db_instance_qs = db_instance_qs.only(*fields)\n        elif deferred_fields:\n            fields = [f.attname for f in self._meta.concrete_fields\n                      if f.attname not in deferred_fields]\n            db_instance_qs = db_instance_qs.only(*fields)\n\n        db_instance = db_instance_qs.get()\n        non_loaded_fields = db_instance.get_deferred_fields()\n        for field in self._meta.concrete_fields:\n            if field.attname in non_loaded_fields:\n                # This field wasn't refreshed - skip ahead.\n                continue\n            setattr(self, field.attname, getattr(db_instance, field.attname))\n            # Throw away stale foreign key references.\n            if field.is_relation and field.is_cached(self):\n                rel_instance = field.get_cached_value(self)\n                local_val = getattr(db_instance, field.attname)\n                related_val = None if rel_instance is None else getattr(rel_instance, field.target_field.attname)\n                if local_val != related_val or (local_val is None and related_val is None):\n                    field.delete_cached_value(self)\n        self._state.db = db_instance._state.db"
        }
      ]
    },
    {
      "pr_number": 8626,
      "pr_title": "Fixed #26362 -- Update the inherited id field of an object when its ancestor changes",
      "pr_body": "https://code.djangoproject.com/ticket/26362",
      "issue_id": 26362,
      "issue_title": "Manually changing the parent of a child model is silently failing.",
      "issue_body": "",
      "issue_closed_at": "2017-06-26T11:11:44",
      "base_commit": "fa283067c94546e38a7c4c3748c5fd31c58b7f22",
      "changes": [
        {
          "file": "django/db/models/fields/related_descriptors.py",
          "type": "function",
          "name": "get_object",
          "class_name": "ForwardOneToOneDescriptor",
          "code": "def get_object(self, instance):\n        if self.field.remote_field.parent_link:\n            deferred = instance.get_deferred_fields()\n            # Because it's a parent link, all the data is available in the\n            # instance, so populate the parent model with this data.\n            rel_model = self.field.remote_field.model\n            fields = [field.attname for field in rel_model._meta.concrete_fields]\n\n            # If any of the related model's fields are deferred, fallback to\n            # fetching all fields from the related model. This avoids a query\n            # on the related model for every deferred field.\n            if not any(field in fields for field in deferred):\n                kwargs = {field: getattr(instance, field) for field in fields}\n                obj = rel_model(**kwargs)\n                obj._state.adding = instance._state.adding\n                obj._state.db = instance._state.db\n                return obj\n        return super().get_object(instance)"
        }
      ]
    },
    {
      "pr_number": 9902,
      "pr_title": "Fixed #29367 -- Fixed model state on objects with a primary key created with QuerySet.bulk_create().",
      "pr_body": "Instance of models with manually set primary_key persisted with\r\nbulk_create would not update the state `adding` and `db` attributes.\r\n\r\nSee: ticket 29367\r\n",
      "issue_id": 29367,
      "issue_title": "bulk_create with manual primary_key don't update instances state",
      "issue_body": "",
      "issue_closed_at": "2018-04-27T17:20:07",
      "base_commit": "3246ad106517e61437f80e8ef3c9d216754039e7",
      "changes": [
        {
          "file": "django/db/models/query.py",
          "type": "function",
          "name": "bulk_create",
          "class_name": "QuerySet",
          "code": "def bulk_create(self, objs, batch_size=None):\n        \"\"\"\n        Insert each of the instances into the database. Do *not* call\n        save() on each of the instances, do not send any pre/post_save\n        signals, and do not set the primary key attribute if it is an\n        autoincrement field (except if features.can_return_ids_from_bulk_insert=True).\n        Multi-table models are not supported.\n        \"\"\"\n        # When you bulk insert you don't get the primary keys back (if it's an\n        # autoincrement, except if can_return_ids_from_bulk_insert=True), so\n        # you can't insert into the child tables which references this. There\n        # are two workarounds:\n        # 1) This could be implemented if you didn't have an autoincrement pk\n        # 2) You could do it by doing O(n) normal inserts into the parent\n        #    tables to get the primary keys back and then doing a single bulk\n        #    insert into the childmost table.\n        # We currently set the primary keys on the objects when using\n        # PostgreSQL via the RETURNING ID clause. It should be possible for\n        # Oracle as well, but the semantics for extracting the primary keys is\n        # trickier so it's not done yet.\n        assert batch_size is None or batch_size > 0\n        # Check that the parents share the same concrete model with the our\n        # model to detect the inheritance pattern ConcreteGrandParent ->\n        # MultiTableParent -> ProxyChild. Simply checking self.model._meta.proxy\n        # would not identify that case as involving multiple tables.\n        for parent in self.model._meta.get_parent_list():\n            if parent._meta.concrete_model is not self.model._meta.concrete_model:\n                raise ValueError(\"Can't bulk create a multi-table inherited model\")\n        if not objs:\n            return objs\n        self._for_write = True\n        connection = connections[self.db]\n        fields = self.model._meta.concrete_fields\n        objs = list(objs)\n        self._populate_pk_values(objs)\n        with transaction.atomic(using=self.db, savepoint=False):\n            objs_with_pk, objs_without_pk = partition(lambda o: o.pk is None, objs)\n            if objs_with_pk:\n                self._batched_insert(objs_with_pk, fields, batch_size)\n            if objs_without_pk:\n                fields = [f for f in fields if not isinstance(f, AutoField)]\n                ids = self._batched_insert(objs_without_pk, fields, batch_size)\n                if connection.features.can_return_ids_from_bulk_insert:\n                    assert len(ids) == len(objs_without_pk)\n                for obj_without_pk, pk in zip(objs_without_pk, ids):\n                    obj_without_pk.pk = pk\n                    obj_without_pk._state.adding = False\n                    obj_without_pk._state.db = self.db\n\n        return objs"
        }
      ]
    }
  ]
}