{
  "instance_id": "django__django-15202",
  "repo": "django/django",
  "created_at": "2021-12-15T15:04:13Z",
  "problem_statement": "URLField throws ValueError instead of ValidationError on clean\nDescription\n\t\nforms.URLField( ).clean('////]@N.AN')\nresults in:\n\tValueError: Invalid IPv6 URL\n\tTraceback (most recent call last):\n\t File \"basic_fuzzer.py\", line 22, in TestOneInput\n\t File \"fuzzers.py\", line 350, in test_forms_URLField\n\t File \"django/forms/fields.py\", line 151, in clean\n\t File \"django/forms/fields.py\", line 136, in run_validators\n\t File \"django/core/validators.py\", line 130, in __call__\n\t File \"urllib/parse.py\", line 440, in urlsplit\n",
  "patch": "diff --git a/django/core/validators.py b/django/core/validators.py\n--- a/django/core/validators.py\n+++ b/django/core/validators.py\n@@ -108,15 +108,16 @@ def __call__(self, value):\n             raise ValidationError(self.message, code=self.code, params={'value': value})\n \n         # Then check full URL\n+        try:\n+            splitted_url = urlsplit(value)\n+        except ValueError:\n+            raise ValidationError(self.message, code=self.code, params={'value': value})\n         try:\n             super().__call__(value)\n         except ValidationError as e:\n             # Trivial case failed. Try for possible IDN domain\n             if value:\n-                try:\n-                    scheme, netloc, path, query, fragment = urlsplit(value)\n-                except ValueError:  # for example, \"Invalid IPv6 URL\"\n-                    raise ValidationError(self.message, code=self.code, params={'value': value})\n+                scheme, netloc, path, query, fragment = splitted_url\n                 try:\n                     netloc = punycode(netloc)  # IDN -> ACE\n                 except UnicodeError:  # invalid domain part\n@@ -127,7 +128,7 @@ def __call__(self, value):\n                 raise\n         else:\n             # Now verify IPv6 in the netloc part\n-            host_match = re.search(r'^\\[(.+)\\](?::\\d{1,5})?$', urlsplit(value).netloc)\n+            host_match = re.search(r'^\\[(.+)\\](?::\\d{1,5})?$', splitted_url.netloc)\n             if host_match:\n                 potential_ip = host_match[1]\n                 try:\n@@ -139,7 +140,7 @@ def __call__(self, value):\n         # section 3.1. It's defined to be 255 bytes or less, but this includes\n         # one byte for the length of the name and one byte for the trailing dot\n         # that's used to indicate absolute names in DNS.\n-        if len(urlsplit(value).hostname) > 253:\n+        if splitted_url.hostname is None or len(splitted_url.hostname) > 253:\n             raise ValidationError(self.message, code=self.code, params={'value': value})\n \n \n",
  "similar_bug_items": [
    {
      "pr_number": 11886,
      "pr_title": "Fixed #30405 -- Fixed source code mismatch crash in ExceptionReporter. ",
      "pr_body": "[ticket 30405](https://code.djangoproject.com/ticket/30405)",
      "issue_id": 30405,
      "issue_title": "IndexError in _get_lines_from_file when module does not match file contents (via loader)",
      "issue_body": "",
      "issue_closed_at": "2019-11-12T04:53:04",
      "base_commit": "6e2f05b2e33a6c80c7a411ce76af7b5a08acb835",
      "changes": [
        {
          "file": "django/views/debug.py",
          "type": "function",
          "name": "get_traceback_text",
          "class_name": "ExceptionReporter",
          "code": "def get_traceback_text(self):\n        \"\"\"Return plain text version of debug 500 HTTP error page.\"\"\"\n        with Path(CURRENT_DIR, 'templates', 'technical_500.txt').open(encoding='utf-8') as fh:\n            t = DEBUG_ENGINE.from_string(fh.read())\n        c = Context(self.get_traceback_data(), autoescape=False, use_l10n=False)\n        return t.render(c)"
        },
        {
          "file": "django/views/debug.py",
          "type": "function",
          "name": "_get_lines_from_file",
          "class_name": "ExceptionReporter",
          "code": "def _get_lines_from_file(self, filename, lineno, context_lines, loader=None, module_name=None):\n        \"\"\"\n        Return context_lines before and after lineno from file.\n        Return (pre_context_lineno, pre_context, context_line, post_context).\n        \"\"\"\n        source = None\n        if hasattr(loader, 'get_source'):\n            try:\n                source = loader.get_source(module_name)\n            except ImportError:\n                pass\n            if source is not None:\n                source = source.splitlines()\n        if source is None:\n            try:\n                with open(filename, 'rb') as fp:\n                    source = fp.read().splitlines()\n            except OSError:\n                pass\n        if source is None:\n            return None, [], None, []\n\n        # If we just read the source from a file, or if the loader did not\n        # apply tokenize.detect_encoding to decode the source into a\n        # string, then we should do that ourselves.\n        if isinstance(source[0], bytes):\n            encoding = 'ascii'\n            for line in source[:2]:\n                # File coding may be specified. Match pattern from PEP-263\n                # (https://www.python.org/dev/peps/pep-0263/)\n                match = re.search(br'coding[:=]\\s*([-\\w.]+)', line)\n                if match:\n                    encoding = match.group(1).decode('ascii')\n                    break\n            source = [str(sline, encoding, 'replace') for sline in source]\n\n        lower_bound = max(0, lineno - context_lines)\n        upper_bound = lineno + context_lines\n\n        pre_context = source[lower_bound:lineno]\n        context_line = source[lineno]\n        post_context = source[lineno + 1:upper_bound]\n\n        return lower_bound, pre_context, context_line, post_context"
        },
        {
          "file": "django/views/debug.py",
          "type": "function",
          "name": "_get_lines_from_file",
          "class_name": "ExceptionReporter",
          "code": "def _get_lines_from_file(self, filename, lineno, context_lines, loader=None, module_name=None):\n        \"\"\"\n        Return context_lines before and after lineno from file.\n        Return (pre_context_lineno, pre_context, context_line, post_context).\n        \"\"\"\n        source = None\n        if hasattr(loader, 'get_source'):\n            try:\n                source = loader.get_source(module_name)\n            except ImportError:\n                pass\n            if source is not None:\n                source = source.splitlines()\n        if source is None:\n            try:\n                with open(filename, 'rb') as fp:\n                    source = fp.read().splitlines()\n            except OSError:\n                pass\n        if source is None:\n            return None, [], None, []\n\n        # If we just read the source from a file, or if the loader did not\n        # apply tokenize.detect_encoding to decode the source into a\n        # string, then we should do that ourselves.\n        if isinstance(source[0], bytes):\n            encoding = 'ascii'\n            for line in source[:2]:\n                # File coding may be specified. Match pattern from PEP-263\n                # (https://www.python.org/dev/peps/pep-0263/)\n                match = re.search(br'coding[:=]\\s*([-\\w.]+)', line)\n                if match:\n                    encoding = match.group(1).decode('ascii')\n                    break\n            source = [str(sline, encoding, 'replace') for sline in source]\n\n        lower_bound = max(0, lineno - context_lines)\n        upper_bound = lineno + context_lines\n\n        pre_context = source[lower_bound:lineno]\n        context_line = source[lineno]\n        post_context = source[lineno + 1:upper_bound]\n\n        return lower_bound, pre_context, context_line, post_context"
        }
      ]
    },
    {
      "pr_number": 10260,
      "pr_title": "Fixed #29613 -- Fixed --keepdb on PostgreSQL if the database exists and the user can't create databases.",
      "pr_body": "Ticket [29613](https://code.djangoproject.com/ticket/29613).",
      "issue_id": 29613,
      "issue_title": "Allow --keepdb to work on PostgreSQL if the database exists but the user can't create databases",
      "issue_body": "",
      "issue_closed_at": "2018-08-03T03:32:30",
      "base_commit": "d8e2be459f97f1773c7edf7d37de180139146176",
      "changes": [
        {
          "file": "django/db/backends/postgresql/creation.py",
          "type": "line",
          "name": "line 3",
          "code": "from psycopg2 import errorcodes\n\nfrom django.db.backends.base.creation import BaseDatabaseCreation\n\n\nclass DatabaseCreation(BaseDatabaseCreation):"
        },
        {
          "file": "django/db/backends/postgresql/creation.py",
          "type": "function",
          "name": "sql_table_creation_suffix",
          "class_name": "DatabaseCreation",
          "code": "def sql_table_creation_suffix(self):\n        test_settings = self.connection.settings_dict['TEST']\n        assert test_settings['COLLATION'] is None, (\n            \"PostgreSQL does not support collation setting at database creation time.\"\n        )\n        return self._get_database_create_suffix(\n            encoding=test_settings['CHARSET'],\n            template=test_settings.get('TEMPLATE'),\n        )"
        }
      ]
    },
    {
      "pr_number": 14578,
      "pr_title": "Fixed #32144 -- Made makemessages remove temporary files when locale path doesn't exist.",
      "pr_body": "Alternative to  #13609 ticket-32144",
      "issue_id": 32144,
      "issue_title": "makemessages leaves temporary files when locale directory doesn't exist.",
      "issue_body": "",
      "issue_closed_at": "2021-07-01T03:11:23",
      "base_commit": "62988afbea7c7ea6ea7eb76382b3a87a5ccf310c",
      "changes": [
        {
          "file": "django/core/management/commands/makemessages.py",
          "type": "function",
          "name": "process_locale_dir",
          "class_name": "Command",
          "code": "def process_locale_dir(self, locale_dir, files):\n        \"\"\"\n        Extract translatable literals from the specified files, creating or\n        updating the POT file for a given locale directory.\n\n        Use the xgettext GNU gettext utility.\n        \"\"\"\n        build_files = []\n        for translatable in files:\n            if self.verbosity > 1:\n                self.stdout.write('processing file %s in %s' % (\n                    translatable.file, translatable.dirpath\n                ))\n            if self.domain not in ('djangojs', 'django'):\n                continue\n            build_file = self.build_file_class(self, self.domain, translatable)\n            try:\n                build_file.preprocess()\n            except UnicodeDecodeError as e:\n                self.stdout.write(\n                    'UnicodeDecodeError: skipped file %s in %s (reason: %s)' % (\n                        translatable.file, translatable.dirpath, e,\n                    )\n                )\n                continue\n            build_files.append(build_file)\n\n        if self.domain == 'djangojs':\n            is_templatized = build_file.is_templatized\n            args = [\n                'xgettext',\n                '-d', self.domain,\n                '--language=%s' % ('C' if is_templatized else 'JavaScript',),\n                '--keyword=gettext_noop',\n                '--keyword=gettext_lazy',\n                '--keyword=ngettext_lazy:1,2',\n                '--keyword=pgettext:1c,2',\n                '--keyword=npgettext:1c,2,3',\n                '--output=-',\n            ]\n        elif self.domain == 'django':\n            args = [\n                'xgettext',\n                '-d', self.domain,\n                '--language=Python',\n                '--keyword=gettext_noop',\n                '--keyword=gettext_lazy',\n                '--keyword=ngettext_lazy:1,2',\n                '--keyword=pgettext:1c,2',\n                '--keyword=npgettext:1c,2,3',\n                '--keyword=pgettext_lazy:1c,2',\n                '--keyword=npgettext_lazy:1c,2,3',\n                '--output=-',\n            ]\n        else:\n            return\n\n        input_files = [bf.work_path for bf in build_files]\n        with NamedTemporaryFile(mode='w+') as input_files_list:\n            input_files_list.write('\\n'.join(input_files))\n            input_files_list.flush()\n            args.extend(['--files-from', input_files_list.name])\n            args.extend(self.xgettext_options)\n            msgs, errors, status = popen_wrapper(args)\n\n        if errors:\n            if status != STATUS_OK:\n                for build_file in build_files:\n                    build_file.cleanup()\n                raise CommandError(\n                    'errors happened while running xgettext on %s\\n%s' %\n                    ('\\n'.join(input_files), errors)\n                )\n            elif self.verbosity > 0:\n                # Print warnings\n                self.stdout.write(errors)\n\n        if msgs:\n            if locale_dir is NO_LOCALE_DIR:\n                file_path = os.path.normpath(build_files[0].path)\n                raise CommandError(\n                    \"Unable to find a locale path to store translations for \"\n                    \"file %s. Make sure the 'locale' directory exists in an \"\n                    \"app or LOCALE_PATHS setting is set.\" % file_path\n                )\n            for build_file in build_files:\n                msgs = build_file.postprocess_messages(msgs)\n            potfile = os.path.join(locale_dir, '%s.pot' % self.domain)\n            write_pot_file(potfile, msgs)\n\n        for build_file in build_files:\n            build_file.cleanup()"
        },
        {
          "file": "django/core/management/commands/makemessages.py",
          "type": "function",
          "name": "process_locale_dir",
          "class_name": "Command",
          "code": "def process_locale_dir(self, locale_dir, files):\n        \"\"\"\n        Extract translatable literals from the specified files, creating or\n        updating the POT file for a given locale directory.\n\n        Use the xgettext GNU gettext utility.\n        \"\"\"\n        build_files = []\n        for translatable in files:\n            if self.verbosity > 1:\n                self.stdout.write('processing file %s in %s' % (\n                    translatable.file, translatable.dirpath\n                ))\n            if self.domain not in ('djangojs', 'django'):\n                continue\n            build_file = self.build_file_class(self, self.domain, translatable)\n            try:\n                build_file.preprocess()\n            except UnicodeDecodeError as e:\n                self.stdout.write(\n                    'UnicodeDecodeError: skipped file %s in %s (reason: %s)' % (\n                        translatable.file, translatable.dirpath, e,\n                    )\n                )\n                continue\n            build_files.append(build_file)\n\n        if self.domain == 'djangojs':\n            is_templatized = build_file.is_templatized\n            args = [\n                'xgettext',\n                '-d', self.domain,\n                '--language=%s' % ('C' if is_templatized else 'JavaScript',),\n                '--keyword=gettext_noop',\n                '--keyword=gettext_lazy',\n                '--keyword=ngettext_lazy:1,2',\n                '--keyword=pgettext:1c,2',\n                '--keyword=npgettext:1c,2,3',\n                '--output=-',\n            ]\n        elif self.domain == 'django':\n            args = [\n                'xgettext',\n                '-d', self.domain,\n                '--language=Python',\n                '--keyword=gettext_noop',\n                '--keyword=gettext_lazy',\n                '--keyword=ngettext_lazy:1,2',\n                '--keyword=pgettext:1c,2',\n                '--keyword=npgettext:1c,2,3',\n                '--keyword=pgettext_lazy:1c,2',\n                '--keyword=npgettext_lazy:1c,2,3',\n                '--output=-',\n            ]\n        else:\n            return\n\n        input_files = [bf.work_path for bf in build_files]\n        with NamedTemporaryFile(mode='w+') as input_files_list:\n            input_files_list.write('\\n'.join(input_files))\n            input_files_list.flush()\n            args.extend(['--files-from', input_files_list.name])\n            args.extend(self.xgettext_options)\n            msgs, errors, status = popen_wrapper(args)\n\n        if errors:\n            if status != STATUS_OK:\n                for build_file in build_files:\n                    build_file.cleanup()\n                raise CommandError(\n                    'errors happened while running xgettext on %s\\n%s' %\n                    ('\\n'.join(input_files), errors)\n                )\n            elif self.verbosity > 0:\n                # Print warnings\n                self.stdout.write(errors)\n\n        if msgs:\n            if locale_dir is NO_LOCALE_DIR:\n                file_path = os.path.normpath(build_files[0].path)\n                raise CommandError(\n                    \"Unable to find a locale path to store translations for \"\n                    \"file %s. Make sure the 'locale' directory exists in an \"\n                    \"app or LOCALE_PATHS setting is set.\" % file_path\n                )\n            for build_file in build_files:\n                msgs = build_file.postprocess_messages(msgs)\n            potfile = os.path.join(locale_dir, '%s.pot' % self.domain)\n            write_pot_file(potfile, msgs)\n\n        for build_file in build_files:\n            build_file.cleanup()"
        }
      ]
    },
    {
      "pr_number": 8228,
      "pr_title": "Fixed #27966 -- Bumped required psycopg2 version to 2.5.4.",
      "pr_body": "",
      "issue_id": 27966,
      "issue_title": "Bump required version of pyscopg2 to 2.5.4",
      "issue_body": "",
      "issue_closed_at": "2017-03-21T11:23:31",
      "base_commit": "7063a85579f40585f2601ba6e6887b0982e7ce43",
      "changes": [
        {
          "file": "django/db/backends/postgresql/base.py",
          "type": "function",
          "name": "psycopg2_version",
          "class_name": "DatabaseWrapper",
          "code": "def psycopg2_version(self):\n        return PSYCOPG2_VERSION"
        }
      ]
    },
    {
      "pr_number": 4114,
      "pr_title": "Fixed #24319 -- Added validation for UUID model field",
      "pr_body": "",
      "issue_id": 24319,
      "issue_title": "UUIDField do not properly clean (validate) value in get_db_prep_value",
      "issue_body": "",
      "issue_closed_at": "2015-02-12T16:58:19",
      "base_commit": "d64baaef3b95abe9ae5d07317c9bf4df02cb8592",
      "changes": [
        {
          "file": "django/db/models/fields/__init__.py",
          "type": "function",
          "name": "get_internal_type",
          "class_name": "UUIDField",
          "code": "def get_internal_type(self):\n        return \"UUIDField\""
        }
      ]
    }
  ]
}