{
  "instance_id": "django__django-15202",
  "repo": "django/django",
  "created_at": "2021-12-15T15:04:13Z",
  "problem_statement": "URLField throws ValueError instead of ValidationError on clean\nDescription\n\t\nforms.URLField( ).clean('////]@N.AN')\nresults in:\n\tValueError: Invalid IPv6 URL\n\tTraceback (most recent call last):\n\t File \"basic_fuzzer.py\", line 22, in TestOneInput\n\t File \"fuzzers.py\", line 350, in test_forms_URLField\n\t File \"django/forms/fields.py\", line 151, in clean\n\t File \"django/forms/fields.py\", line 136, in run_validators\n\t File \"django/core/validators.py\", line 130, in __call__\n\t File \"urllib/parse.py\", line 440, in urlsplit\n",
  "patch": "diff --git a/django/core/validators.py b/django/core/validators.py\n--- a/django/core/validators.py\n+++ b/django/core/validators.py\n@@ -108,15 +108,16 @@ def __call__(self, value):\n             raise ValidationError(self.message, code=self.code, params={'value': value})\n \n         # Then check full URL\n+        try:\n+            splitted_url = urlsplit(value)\n+        except ValueError:\n+            raise ValidationError(self.message, code=self.code, params={'value': value})\n         try:\n             super().__call__(value)\n         except ValidationError as e:\n             # Trivial case failed. Try for possible IDN domain\n             if value:\n-                try:\n-                    scheme, netloc, path, query, fragment = urlsplit(value)\n-                except ValueError:  # for example, \"Invalid IPv6 URL\"\n-                    raise ValidationError(self.message, code=self.code, params={'value': value})\n+                scheme, netloc, path, query, fragment = splitted_url\n                 try:\n                     netloc = punycode(netloc)  # IDN -> ACE\n                 except UnicodeError:  # invalid domain part\n@@ -127,7 +128,7 @@ def __call__(self, value):\n                 raise\n         else:\n             # Now verify IPv6 in the netloc part\n-            host_match = re.search(r'^\\[(.+)\\](?::\\d{1,5})?$', urlsplit(value).netloc)\n+            host_match = re.search(r'^\\[(.+)\\](?::\\d{1,5})?$', splitted_url.netloc)\n             if host_match:\n                 potential_ip = host_match[1]\n                 try:\n@@ -139,7 +140,7 @@ def __call__(self, value):\n         # section 3.1. It's defined to be 255 bytes or less, but this includes\n         # one byte for the length of the name and one byte for the trailing dot\n         # that's used to indicate absolute names in DNS.\n-        if len(urlsplit(value).hostname) > 253:\n+        if splitted_url.hostname is None or len(splitted_url.hostname) > 253:\n             raise ValidationError(self.message, code=self.code, params={'value': value})\n \n \n",
  "similar_bug_items": [
    {
      "pr_number": 11886,
      "pr_title": "Fixed #30405 -- Fixed source code mismatch crash in ExceptionReporter. ",
      "pr_body": "[ticket 30405](https://code.djangoproject.com/ticket/30405)",
      "issue_id": 30405,
      "issue_title": "IndexError in _get_lines_from_file when module does not match file contents (via loader)",
      "issue_body": "self = <django.views.debug.ExceptionReporter object at 0x7f2a7908ac18>\nfilename = '…/project/.venv/lib/python3.7/site-packages/pdb.py'\nlineno = 230\ncontext_lines = 7\nloader = <_frozen_importlib_external.SourceFileLoader object at 0x7f2a73609278>\nmodule_name = 'pdb'\n\n[23]   …/Vcs/django/django/core/handlers/exception.py(90)response_for_exception()\n-> response = handle_uncaught_exception(request, get_resolver(get_urlconf()), sys.exc_info())\n[24]   …/Vcs/django/django/core/handlers/exception.py(125)handle_uncaught_exception()\n-> return debug.technical_500_response(request, *exc_info)\n[25]   …/Vcs/django/django/views/debug.py(94)technical_500_response()\n-> html = reporter.get_traceback_html()\n[26]   …/Vcs/django/django/views/debug.py(333)get_traceback_html()\n-> c = Context(self.get_traceback_data(), use_l10n=False)\n[27]   …/Vcs/django/django/views/debug.py(264)get_traceback_data()\n-> frames = self.get_traceback_frames()\n[28]   …/Vcs/django/django/views/debug.py(427)get_traceback_frames()\n-> filename, lineno, 7, loader, module_name,\n\n 385             try:\n 386                 context_line = source[lineno]\n 387             except:\n 388                 __import__('pdb').set_trace()\n 389  ->         post_context = source[lineno + 1:upper_bound]\n 390\n 391             return lower_bound, pre_context, context_line, post_context\n(Pdb++) source\n['# this file is needed to hijack pdb without eggs', 'import os.path', \"pdb_path = os.path.join(os.path.dirname(os.path.dirname(__file__)), 'pdb.py')\", 'with open(pdb_path) as f:', \"    exec(compile(f.read(), pdb_path, 'exec'))\"]\nIt uses the loader (\n​\nhttps://github.com/django/django/blob/47885278c669dd7a13a4c3ff7e58e1cbe88af385/django/views/debug.py#L351\n), which picks up the\npth\n, and then the contents does not match the expected line number.\nI think it should maybe always use the given filename?!",
      "issue_closed_at": "2019-11-12T04:53:04",
      "base_commit": "6e2f05b2e33a6c80c7a411ce76af7b5a08acb835",
      "changes": [
        {
          "file": "django/views/debug.py",
          "type": "function",
          "name": "get_traceback_text",
          "class_name": "ExceptionReporter",
          "code": "def get_traceback_text(self):\n        \"\"\"Return plain text version of debug 500 HTTP error page.\"\"\"\n        with Path(CURRENT_DIR, 'templates', 'technical_500.txt').open(encoding='utf-8') as fh:\n            t = DEBUG_ENGINE.from_string(fh.read())\n        c = Context(self.get_traceback_data(), autoescape=False, use_l10n=False)\n        return t.render(c)"
        },
        {
          "file": "django/views/debug.py",
          "type": "function",
          "name": "_get_lines_from_file",
          "class_name": "ExceptionReporter",
          "code": "def _get_lines_from_file(self, filename, lineno, context_lines, loader=None, module_name=None):\n        \"\"\"\n        Return context_lines before and after lineno from file.\n        Return (pre_context_lineno, pre_context, context_line, post_context).\n        \"\"\"\n        source = None\n        if hasattr(loader, 'get_source'):\n            try:\n                source = loader.get_source(module_name)\n            except ImportError:\n                pass\n            if source is not None:\n                source = source.splitlines()\n        if source is None:\n            try:\n                with open(filename, 'rb') as fp:\n                    source = fp.read().splitlines()\n            except OSError:\n                pass\n        if source is None:\n            return None, [], None, []\n\n        # If we just read the source from a file, or if the loader did not\n        # apply tokenize.detect_encoding to decode the source into a\n        # string, then we should do that ourselves.\n        if isinstance(source[0], bytes):\n            encoding = 'ascii'\n            for line in source[:2]:\n                # File coding may be specified. Match pattern from PEP-263\n                # (https://www.python.org/dev/peps/pep-0263/)\n                match = re.search(br'coding[:=]\\s*([-\\w.]+)', line)\n                if match:\n                    encoding = match.group(1).decode('ascii')\n                    break\n            source = [str(sline, encoding, 'replace') for sline in source]\n\n        lower_bound = max(0, lineno - context_lines)\n        upper_bound = lineno + context_lines\n\n        pre_context = source[lower_bound:lineno]\n        context_line = source[lineno]\n        post_context = source[lineno + 1:upper_bound]\n\n        return lower_bound, pre_context, context_line, post_context"
        },
        {
          "file": "django/views/debug.py",
          "type": "function",
          "name": "_get_lines_from_file",
          "class_name": "ExceptionReporter",
          "code": "def _get_lines_from_file(self, filename, lineno, context_lines, loader=None, module_name=None):\n        \"\"\"\n        Return context_lines before and after lineno from file.\n        Return (pre_context_lineno, pre_context, context_line, post_context).\n        \"\"\"\n        source = None\n        if hasattr(loader, 'get_source'):\n            try:\n                source = loader.get_source(module_name)\n            except ImportError:\n                pass\n            if source is not None:\n                source = source.splitlines()\n        if source is None:\n            try:\n                with open(filename, 'rb') as fp:\n                    source = fp.read().splitlines()\n            except OSError:\n                pass\n        if source is None:\n            return None, [], None, []\n\n        # If we just read the source from a file, or if the loader did not\n        # apply tokenize.detect_encoding to decode the source into a\n        # string, then we should do that ourselves.\n        if isinstance(source[0], bytes):\n            encoding = 'ascii'\n            for line in source[:2]:\n                # File coding may be specified. Match pattern from PEP-263\n                # (https://www.python.org/dev/peps/pep-0263/)\n                match = re.search(br'coding[:=]\\s*([-\\w.]+)', line)\n                if match:\n                    encoding = match.group(1).decode('ascii')\n                    break\n            source = [str(sline, encoding, 'replace') for sline in source]\n\n        lower_bound = max(0, lineno - context_lines)\n        upper_bound = lineno + context_lines\n\n        pre_context = source[lower_bound:lineno]\n        context_line = source[lineno]\n        post_context = source[lineno + 1:upper_bound]\n\n        return lower_bound, pre_context, context_line, post_context"
        }
      ]
    },
    {
      "pr_number": 10260,
      "pr_title": "Fixed #29613 -- Fixed --keepdb on PostgreSQL if the database exists and the user can't create databases.",
      "pr_body": "Ticket [29613](https://code.djangoproject.com/ticket/29613).",
      "issue_id": 29613,
      "issue_title": "Allow --keepdb to work on PostgreSQL if the database exists but the user can't create databases",
      "issue_body": "The popular Web Faction hosting service uses a shared database server. Users can create databases using the web UI or XML RPC calls, but not using the SQL CREATE syntax.\nRunning tests throws a ProgrammingError, with the message 'permission denied to create database', even if the test database has been previously created manually.\nThe error code for this error is '42501', which appears to correspond to errorcodes.INSUFFICIENT_PRIVILEGE.\ndjango/db/backends/postgresql/creation.py only handles the error errorcodes.DUPLICATE_DATABASE in _execute_create_test_db(), line 35. Because the error code does not match the program exits with a log message. But it would be fine to proceed with the error code '42501' also, making use of the --keepdb mechanism.\nThis appears to be a regression, as I did not experience this issue either using postgresql_psycopg2 driver or using Django 1.11",
      "issue_closed_at": "2018-08-03T03:32:30",
      "base_commit": "d8e2be459f97f1773c7edf7d37de180139146176",
      "changes": [
        {
          "file": "django/db/backends/postgresql/creation.py",
          "type": "line",
          "name": "line 3",
          "code": "from psycopg2 import errorcodes\n\nfrom django.db.backends.base.creation import BaseDatabaseCreation\n\n\nclass DatabaseCreation(BaseDatabaseCreation):"
        },
        {
          "file": "django/db/backends/postgresql/creation.py",
          "type": "function",
          "name": "sql_table_creation_suffix",
          "class_name": "DatabaseCreation",
          "code": "def sql_table_creation_suffix(self):\n        test_settings = self.connection.settings_dict['TEST']\n        assert test_settings['COLLATION'] is None, (\n            \"PostgreSQL does not support collation setting at database creation time.\"\n        )\n        return self._get_database_create_suffix(\n            encoding=test_settings['CHARSET'],\n            template=test_settings.get('TEMPLATE'),\n        )"
        }
      ]
    },
    {
      "pr_number": 14578,
      "pr_title": "Fixed #32144 -- Made makemessages remove temporary files when locale path doesn't exist.",
      "pr_body": "Alternative to  #13609 ticket-32144",
      "issue_id": 32144,
      "issue_title": "makemessages leaves temporary files when locale directory doesn't exist.",
      "issue_body": "If you run makemessages and you end up with the error message \"Unable to find a locale path to store translations for file [...]\", you get a lot of temporary files left over that you need to clean up.\nThe fix is pretty trivial so a PR is on the way.",
      "issue_closed_at": "2021-07-01T03:11:23",
      "base_commit": "62988afbea7c7ea6ea7eb76382b3a87a5ccf310c",
      "changes": [
        {
          "file": "django/core/management/commands/makemessages.py",
          "type": "function",
          "name": "process_locale_dir",
          "class_name": "Command",
          "code": "def process_locale_dir(self, locale_dir, files):\n        \"\"\"\n        Extract translatable literals from the specified files, creating or\n        updating the POT file for a given locale directory.\n\n        Use the xgettext GNU gettext utility.\n        \"\"\"\n        build_files = []\n        for translatable in files:\n            if self.verbosity > 1:\n                self.stdout.write('processing file %s in %s' % (\n                    translatable.file, translatable.dirpath\n                ))\n            if self.domain not in ('djangojs', 'django'):\n                continue\n            build_file = self.build_file_class(self, self.domain, translatable)\n            try:\n                build_file.preprocess()\n            except UnicodeDecodeError as e:\n                self.stdout.write(\n                    'UnicodeDecodeError: skipped file %s in %s (reason: %s)' % (\n                        translatable.file, translatable.dirpath, e,\n                    )\n                )\n                continue\n            build_files.append(build_file)\n\n        if self.domain == 'djangojs':\n            is_templatized = build_file.is_templatized\n            args = [\n                'xgettext',\n                '-d', self.domain,\n                '--language=%s' % ('C' if is_templatized else 'JavaScript',),\n                '--keyword=gettext_noop',\n                '--keyword=gettext_lazy',\n                '--keyword=ngettext_lazy:1,2',\n                '--keyword=pgettext:1c,2',\n                '--keyword=npgettext:1c,2,3',\n                '--output=-',\n            ]\n        elif self.domain == 'django':\n            args = [\n                'xgettext',\n                '-d', self.domain,\n                '--language=Python',\n                '--keyword=gettext_noop',\n                '--keyword=gettext_lazy',\n                '--keyword=ngettext_lazy:1,2',\n                '--keyword=pgettext:1c,2',\n                '--keyword=npgettext:1c,2,3',\n                '--keyword=pgettext_lazy:1c,2',\n                '--keyword=npgettext_lazy:1c,2,3',\n                '--output=-',\n            ]\n        else:\n            return\n\n        input_files = [bf.work_path for bf in build_files]\n        with NamedTemporaryFile(mode='w+') as input_files_list:\n            input_files_list.write('\\n'.join(input_files))\n            input_files_list.flush()\n            args.extend(['--files-from', input_files_list.name])\n            args.extend(self.xgettext_options)\n            msgs, errors, status = popen_wrapper(args)\n\n        if errors:\n            if status != STATUS_OK:\n                for build_file in build_files:\n                    build_file.cleanup()\n                raise CommandError(\n                    'errors happened while running xgettext on %s\\n%s' %\n                    ('\\n'.join(input_files), errors)\n                )\n            elif self.verbosity > 0:\n                # Print warnings\n                self.stdout.write(errors)\n\n        if msgs:\n            if locale_dir is NO_LOCALE_DIR:\n                file_path = os.path.normpath(build_files[0].path)\n                raise CommandError(\n                    \"Unable to find a locale path to store translations for \"\n                    \"file %s. Make sure the 'locale' directory exists in an \"\n                    \"app or LOCALE_PATHS setting is set.\" % file_path\n                )\n            for build_file in build_files:\n                msgs = build_file.postprocess_messages(msgs)\n            potfile = os.path.join(locale_dir, '%s.pot' % self.domain)\n            write_pot_file(potfile, msgs)\n\n        for build_file in build_files:\n            build_file.cleanup()"
        },
        {
          "file": "django/core/management/commands/makemessages.py",
          "type": "function",
          "name": "process_locale_dir",
          "class_name": "Command",
          "code": "def process_locale_dir(self, locale_dir, files):\n        \"\"\"\n        Extract translatable literals from the specified files, creating or\n        updating the POT file for a given locale directory.\n\n        Use the xgettext GNU gettext utility.\n        \"\"\"\n        build_files = []\n        for translatable in files:\n            if self.verbosity > 1:\n                self.stdout.write('processing file %s in %s' % (\n                    translatable.file, translatable.dirpath\n                ))\n            if self.domain not in ('djangojs', 'django'):\n                continue\n            build_file = self.build_file_class(self, self.domain, translatable)\n            try:\n                build_file.preprocess()\n            except UnicodeDecodeError as e:\n                self.stdout.write(\n                    'UnicodeDecodeError: skipped file %s in %s (reason: %s)' % (\n                        translatable.file, translatable.dirpath, e,\n                    )\n                )\n                continue\n            build_files.append(build_file)\n\n        if self.domain == 'djangojs':\n            is_templatized = build_file.is_templatized\n            args = [\n                'xgettext',\n                '-d', self.domain,\n                '--language=%s' % ('C' if is_templatized else 'JavaScript',),\n                '--keyword=gettext_noop',\n                '--keyword=gettext_lazy',\n                '--keyword=ngettext_lazy:1,2',\n                '--keyword=pgettext:1c,2',\n                '--keyword=npgettext:1c,2,3',\n                '--output=-',\n            ]\n        elif self.domain == 'django':\n            args = [\n                'xgettext',\n                '-d', self.domain,\n                '--language=Python',\n                '--keyword=gettext_noop',\n                '--keyword=gettext_lazy',\n                '--keyword=ngettext_lazy:1,2',\n                '--keyword=pgettext:1c,2',\n                '--keyword=npgettext:1c,2,3',\n                '--keyword=pgettext_lazy:1c,2',\n                '--keyword=npgettext_lazy:1c,2,3',\n                '--output=-',\n            ]\n        else:\n            return\n\n        input_files = [bf.work_path for bf in build_files]\n        with NamedTemporaryFile(mode='w+') as input_files_list:\n            input_files_list.write('\\n'.join(input_files))\n            input_files_list.flush()\n            args.extend(['--files-from', input_files_list.name])\n            args.extend(self.xgettext_options)\n            msgs, errors, status = popen_wrapper(args)\n\n        if errors:\n            if status != STATUS_OK:\n                for build_file in build_files:\n                    build_file.cleanup()\n                raise CommandError(\n                    'errors happened while running xgettext on %s\\n%s' %\n                    ('\\n'.join(input_files), errors)\n                )\n            elif self.verbosity > 0:\n                # Print warnings\n                self.stdout.write(errors)\n\n        if msgs:\n            if locale_dir is NO_LOCALE_DIR:\n                file_path = os.path.normpath(build_files[0].path)\n                raise CommandError(\n                    \"Unable to find a locale path to store translations for \"\n                    \"file %s. Make sure the 'locale' directory exists in an \"\n                    \"app or LOCALE_PATHS setting is set.\" % file_path\n                )\n            for build_file in build_files:\n                msgs = build_file.postprocess_messages(msgs)\n            potfile = os.path.join(locale_dir, '%s.pot' % self.domain)\n            write_pot_file(potfile, msgs)\n\n        for build_file in build_files:\n            build_file.cleanup()"
        }
      ]
    },
    {
      "pr_number": 8228,
      "pr_title": "Fixed #27966 -- Bumped required psycopg2 version to 2.5.4.",
      "pr_body": "",
      "issue_id": 27966,
      "issue_title": "Bump required version of pyscopg2 to 2.5.4",
      "issue_body": "​\nthis commit\nuses the cursor as context manager (line in question is marked), which were added in psycopg2 2.5 (\n​\nrelease notes\n) (see third item)\nbut\n​\nhere\ndjango checks only for 2.4.5.\n​\nthis commit here\nmade 2.4.5 a requirement and documented that in a few places.",
      "issue_closed_at": "2017-03-21T11:23:31",
      "base_commit": "7063a85579f40585f2601ba6e6887b0982e7ce43",
      "changes": [
        {
          "file": "django/db/backends/postgresql/base.py",
          "type": "function",
          "name": "psycopg2_version",
          "class_name": "DatabaseWrapper",
          "code": "def psycopg2_version(self):\n        return PSYCOPG2_VERSION"
        }
      ]
    },
    {
      "pr_number": 4114,
      "pr_title": "Fixed #24319 -- Added validation for UUID model field",
      "pr_body": "",
      "issue_id": 24319,
      "issue_title": "UUIDField do not properly clean (validate) value in get_db_prep_value",
      "issue_body": "Use case\n: Using user's input to retrieve a model from database.\nIssue\n: The UUIDField doesn't properly *clean* the input value, meaning the ORM will query the database even the query values aren't cleaned.\nSystem\n: Ubuntu 14.04 LTS + PostgresSQL 9.3\nGood\n: User.objects.get(pk='ssss') -> ValueError\nBad\n: Media.objects.get(pk='ssss') -> DataError\nclass Media(models.Model):\n    pk = models.UUIDField()\n>>> User.objects.get(pk='ssss')\nTraceback (most recent call last):\n  File \"<input>\", line 1, in <module>\n  File \"venv/src/django/django/db/models/manager.py\", line 127, in manager_method\n    return getattr(self.get_queryset(), name)(*args, **kwargs)\n  File \"venv/src/django/django/db/models/query.py\", line 320, in get\n    clone = self.filter(*args, **kwargs)\n  File \"venv/src/django/django/db/models/query.py\", line 671, in filter\n    return self._filter_or_exclude(False, *args, **kwargs)\n  File \"venv/src/django/django/db/models/query.py\", line 689, in _filter_or_exclude\n    clone.query.add_q(Q(*args, **kwargs))\n  File \"venv/src/django/django/db/models/sql/query.py\", line 1284, in add_q\n    clause, require_inner = self._add_q(where_part, self.used_aliases)\n  File \"venv/src/django/django/db/models/sql/query.py\", line 1311, in _add_q\n    current_negated=current_negated, connector=connector, allow_joins=allow_joins)\n  File \"venv/src/django/django/db/models/sql/query.py\", line 1183, in build_filter\n    condition = self.build_lookup(lookups, col, value)\n  File \"venv/src/django/django/db/models/sql/query.py\", line 1079, in build_lookup\n    return final_lookup(lhs, rhs)\n  File \"venv/src/django/django/db/models/lookups.py\", line 96, in __init__\n    self.rhs = self.get_prep_lookup()\n  File \"venv/src/django/django/db/models/lookups.py\", line 134, in get_prep_lookup\n    return self.lhs.output_field.get_prep_lookup(self.lookup_name, self.rhs)\n  File \"venv/src/django/django/db/models/fields/__init__.py\", line 716, in get_prep_lookup\n    return self.get_prep_value(value)\n  File \"venv/src/django/django/db/models/fields/__init__.py\", line 974, in get_prep_value\n    return int(value)\nValueError: invalid literal for int() with base 10: 'ssss'\n>>> Media.objects.get(pk='ssss')\nTraceback (most recent call last):\n  File \"<input>\", line 1, in <module>\n  File \"venv/src/django/django/db/models/manager.py\", line 127, in manager_method\n    return getattr(self.get_queryset(), name)(*args, **kwargs)\n  File \"venv/src/django/django/db/models/query.py\", line 326, in get\n    num = len(clone)\n  File \"venv/src/django/django/db/models/query.py\", line 145, in __len__\n    self._fetch_all()\n  File \"venv/src/django/django/db/models/query.py\", line 955, in _fetch_all\n    self._result_cache = list(self.iterator())\n  File \"venv/src/django/django/db/models/query.py\", line 239, in iterator\n    results = compiler.execute_sql()\n  File \"venv/src/django/django/db/models/sql/compiler.py\", line 826, in execute_sql\n    cursor.execute(sql, params)\n  File \"venv/src/django/django/db/backends/utils.py\", line 80, in execute\n    return super(CursorDebugWrapper, self).execute(sql, params)\n  File \"venv/src/django/django/db/backends/utils.py\", line 65, in execute\n    return self.cursor.execute(sql, params)\n  File \"venv/src/django/django/db/utils.py\", line 95, in __exit__\n    six.reraise(dj_exc_type, dj_exc_value, traceback)\n  File \"venv/src/django/django/utils/six.py\", line 658, in reraise\n    raise value.with_traceback(tb)\n  File \"venv/src/django/django/db/backends/utils.py\", line 65, in execute\n    return self.cursor.execute(sql, params)\ndjango.db.utils.DataError: invalid input syntax for uuid: \"ssss\"\nLINE 1: ...oudncode_media\" WHERE \"cloudncode_media\".\"uuid\" = 'ssss' LIM...",
      "issue_closed_at": "2015-02-12T16:58:19",
      "base_commit": "d64baaef3b95abe9ae5d07317c9bf4df02cb8592",
      "changes": [
        {
          "file": "django/db/models/fields/__init__.py",
          "type": "function",
          "name": "get_internal_type",
          "class_name": "UUIDField",
          "code": "def get_internal_type(self):\n        return \"UUIDField\""
        }
      ]
    }
  ]
}