{
  "Selected_candidate": {
    "pr_number": 10910,
    "pr_title": "Fixed #30128 -- Fixed handling timedelta timezone in database functions.",
    "pr_body": "Ticket: [#30128](https://code.djangoproject.com/ticket/30128)",
    "issue_id": 30128,
    "issue_title": "Using database functions with tzinfo=datetime.timezone(datetime.timedelta(...)) results in an incorrect query",
    "issue_body": "I haven’t checked this bug with other databases, but it definitely works improperly with postgres.\nDjango ORM create incorrect query when I use timezone determined like \"timezone(timedelta(hours=some_hours))\".\n\"timezone(timedelta(hours=5))\" in query will look like \"UTC+05:00\", but postgres doesn't know this timezone name and handle it as POSIX style.\n\"UTC\" part will be interpreted as some zone abbreviation and timezone will be shifted by 5 hours to the west (positive shift is shift to the west in accordance with POSIX standart), i.e. actually timezone will be equal to UTC-5.\nFrom\n​\nhttps://www.postgresql.org/docs/10/datatype-datetime.html\n:\n\"In addition to the timezone names and abbreviations, PostgreSQL will accept POSIX-style time zone specifications of the form STDoffset or STDoffsetDST, where STD is a zone abbreviation, offset is a numeric offset in hours west from UTC\"\nChecked with:\ndjango==2.1.5\npsycopg2==2.7.6.1\npostgreSQL==10.6\nUsing the following example model:\nclass test(models.Model):\n    class Meta:\n        db_table = 'test_timezones'\n\n    datetime = models.DateTimeField()\nSample of bug is bellow:\n>>> from datetime import timezone, timedelta\n>>> from django.db.models.functions import ExtractWeekDay\n>>> from django_issues.models import test\n>>> from django.db.models.functions import ExtractHour\n>>> from pytz import timezone as pytz_timezone\n>>> print(test.objects.annotate(hour=ExtractHour('datetime')).values('datetime', 'hour').get())\n{'datetime': datetime.datetime(2018, 1, 1, 7, 0, tzinfo=<UTC>), 'hour': 7}\n>>> tz = timezone(timedelta(hours=5))\n>>> print(tz)\nUTC+05:00\n>>> print(test.objects.annotate(hour=ExtractHour('datetime', tzinfo=tz)).values('datetime', 'hour').get())\n{'datetime': datetime.datetime(2018, 1, 1, 7, 0, tzinfo=<UTC>), 'hour': 2}\n>>> print(test.objects.annotate(hour=ExtractHour('datetime', tzinfo=tz)).values('datetime', 'hour').query)\nSELECT \"test_timezones\".\"datetime\", EXTRACT('hour' FROM \"test_timezones\".\"datetime\" AT TIME ZONE 'UTC+05:00') AS \"hour\" FROM \"test_timezones\"\n>>> tz2 = pytz_timezone('Asia/Yekaterinburg')\n>>> print(tz2)\nAsia/Yekaterinburg\n>>> print(test.objects.annotate(hour=ExtractHour('datetime', tzinfo=tz2)).values('datetime', 'hour').get())\n{'datetime': datetime.datetime(2018, 1, 1, 7, 0, tzinfo=<UTC>), 'hour': 12}",
    "issue_closed_at": "2019-06-13T03:17:18",
    "base_commit": "3dca8738cbbbb5674f795169e5ea25e2002f2d71",
    "changes": [
      {
        "file": "django/db/backends/mysql/operations.py",
        "type": "function",
        "name": "date_trunc_sql",
        "class_name": "DatabaseOperations",
        "code": "def date_trunc_sql(self, lookup_type, field_name):\n        fields = {\n            'year': '%%Y-01-01',\n            'month': '%%Y-%%m-01',\n        }  # Use double percents to escape.\n        if lookup_type in fields:\n            format_str = fields[lookup_type]\n            return \"CAST(DATE_FORMAT(%s, '%s') AS DATE)\" % (field_name, format_str)\n        elif lookup_type == 'quarter':\n            return \"MAKEDATE(YEAR(%s), 1) + INTERVAL QUARTER(%s) QUARTER - INTERVAL 1 QUARTER\" % (\n                field_name, field_name\n            )\n        elif lookup_type == 'week':\n            return \"DATE_SUB(%s, INTERVAL WEEKDAY(%s) DAY)\" % (\n                field_name, field_name\n            )\n        else:\n            return \"DATE(%s)\" % (field_name)"
      },
      {
        "file": "django/db/backends/oracle/operations.py",
        "type": "function",
        "name": "date_trunc_sql",
        "class_name": "DatabaseOperations",
        "code": "def date_trunc_sql(self, lookup_type, field_name):\n        # https://docs.oracle.com/en/database/oracle/oracle-database/18/sqlrf/ROUND-and-TRUNC-Date-Functions.html\n        if lookup_type in ('year', 'month'):\n            return \"TRUNC(%s, '%s')\" % (field_name, lookup_type.upper())\n        elif lookup_type == 'quarter':\n            return \"TRUNC(%s, 'Q')\" % field_name\n        elif lookup_type == 'week':\n            return \"TRUNC(%s, 'IW')\" % field_name\n        else:\n            return \"TRUNC(%s)\" % field_name"
      },
      {
        "file": "django/db/backends/oracle/operations.py",
        "type": "function",
        "name": "_convert_field_to_tz",
        "class_name": "DatabaseOperations",
        "code": "def _convert_field_to_tz(self, field_name, tzname):\n        if not settings.USE_TZ:\n            return field_name\n        if not self._tzname_re.match(tzname):\n            raise ValueError(\"Invalid time zone name: %s\" % tzname)\n        # Convert from connection timezone to the local time, returning\n        # TIMESTAMP WITH TIME ZONE and cast it back to TIMESTAMP to strip the\n        # TIME ZONE details.\n        if self.connection.timezone_name != tzname:\n            return \"CAST((FROM_TZ(%s, '%s') AT TIME ZONE '%s') AS TIMESTAMP)\" % (\n                field_name,\n                self.connection.timezone_name,\n                tzname,\n            )\n        return field_name"
      },
      {
        "file": "django/db/backends/postgresql/operations.py",
        "type": "function",
        "name": "date_trunc_sql",
        "class_name": "DatabaseOperations",
        "code": "def date_trunc_sql(self, lookup_type, field_name):\n        # https://www.postgresql.org/docs/current/functions-datetime.html#FUNCTIONS-DATETIME-TRUNC\n        return \"DATE_TRUNC('%s', %s)\" % (lookup_type, field_name)"
      },
      {
        "file": "django/db/backends/sqlite3/base.py",
        "type": "function",
        "name": "_sqlite_datetime_parse",
        "class_name": null,
        "code": "def _sqlite_datetime_parse(dt, tzname=None, conn_tzname=None):\n    if dt is None:\n        return None\n    try:\n        dt = backend_utils.typecast_timestamp(dt)\n    except (TypeError, ValueError):\n        return None\n    if conn_tzname:\n        dt = dt.replace(tzinfo=pytz.timezone(conn_tzname))\n    if tzname is not None and tzname != conn_tzname:\n        dt = timezone.localtime(dt, pytz.timezone(tzname))\n    return dt"
      }
    ]
  },
  "Justification": "Candidate D is the most helpful report because it addresses similar issues of incorrect SQL generation in Django's ORM, specifically with regard to the handling of timezones and datetime values. Both the CURRENT bug and Candidate D deal with how queries constructed in Django lead to unexpected SQL output. Additionally, Candidate D's bug fix pertained to adjustments in the way that timezones and datetime fields are processed by the database backends, which may provide relevant insights into the GROUP BY issue experienced in the CURRENT bug when filtering users. This similarity in the problems and their contexts makes Candidate D especially useful for debugging the CURRENT bug.",
  "instance_id": "django__django-11797",
  "repo": "django/django",
  "created_at": "2019-09-20T02:23:19Z",
  "problem_statement": "Filtering on query result overrides GROUP BY of internal query\nDescription\n\t\nfrom django.contrib.auth import models\na = models.User.objects.filter(email__isnull=True).values('email').annotate(m=Max('id')).values('m')\nprint(a.query) # good\n# SELECT MAX(\"auth_user\".\"id\") AS \"m\" FROM \"auth_user\" WHERE \"auth_user\".\"email\" IS NULL GROUP BY \"auth_user\".\"email\"\nprint(a[:1].query) # good\n# SELECT MAX(\"auth_user\".\"id\") AS \"m\" FROM \"auth_user\" WHERE \"auth_user\".\"email\" IS NULL GROUP BY \"auth_user\".\"email\" LIMIT 1\nb = models.User.objects.filter(id=a[:1])\nprint(b.query) # GROUP BY U0.\"id\" should be GROUP BY U0.\"email\"\n# SELECT ... FROM \"auth_user\" WHERE \"auth_user\".\"id\" = (SELECT U0.\"id\" FROM \"auth_user\" U0 WHERE U0.\"email\" IS NULL GROUP BY U0.\"id\" LIMIT 1)\n",
  "patch": "diff --git a/django/db/models/lookups.py b/django/db/models/lookups.py\n--- a/django/db/models/lookups.py\n+++ b/django/db/models/lookups.py\n@@ -262,9 +262,9 @@ def process_rhs(self, compiler, connection):\n         from django.db.models.sql.query import Query\n         if isinstance(self.rhs, Query):\n             if self.rhs.has_limit_one():\n-                # The subquery must select only the pk.\n-                self.rhs.clear_select_clause()\n-                self.rhs.add_fields(['pk'])\n+                if not self.rhs.has_select_fields:\n+                    self.rhs.clear_select_clause()\n+                    self.rhs.add_fields(['pk'])\n             else:\n                 raise ValueError(\n                     'The QuerySet value for an exact lookup must be limited to '\n"
}