{
  "Selected_candidate": {
    "pr_number": 7226,
    "pr_title": "Fix #7220: genindex: \"main\" index entries are not shown at first",
    "pr_body": "### Feature or Bugfix\r\n- Feature\r\n\r\n### Purpose\r\n- refs: #7220 ",
    "issue_id": 7220,
    "issue_title": "Make \"main\" index entries the first",
    "issue_body": "You can mark up “main” index entries by prefixing them with an exclamation mark. The references to “main” entries are emphasized in the generated index. But it does not change the order of entries, so the \"main\" index entry can be the last one.\r\n\r\nFor example, look at the index for \"import statement\" in the Python documentation. https://docs.python.org/3/genindex-I.html. There are 5 references. The last one is marked as \"main\".\r\n\r\nWould be nice if references to \"main\" entries be moved to the beginning of the list.\r\n\r\nThis issue was reported on the Python bug tracker: https://bugs.python.org/issue22714.",
    "issue_closed_at": "2020-02-29T17:14:20Z",
    "base_commit": "201455900a5fe938a1aadb4af37a2b13aeaa44bd",
    "changes": [
      {
        "file": "sphinx/environment/adapters/indexentries.py",
        "type": "line",
        "name": "line 7",
        "code": "    :copyright: Copyright 2007-2020 by the Sphinx team, see AUTHORS.\n    :license: BSD, see LICENSE for details.\n\"\"\"\nimport bisect\nimport re\nimport unicodedata\nfrom itertools import groupby"
      },
      {
        "file": "sphinx/environment/adapters/indexentries.py",
        "type": "function",
        "name": "add_entry",
        "class_name": "IndexEntries",
        "code": "def add_entry(word: str, subword: str, main: str, link: bool = True,\n                      dic: Dict = new, key: str = None) -> None:\n            # Force the word to be unicode if it's a ASCII bytestring.\n            # This will solve problems with unicode normalization later.\n            # For instance the RFC role will add bytestrings at the moment\n            word = str(word)\n            entry = dic.get(word)\n            if not entry:\n                dic[word] = entry = [[], {}, key]\n            if subword:\n                add_entry(subword, '', main, link=link, dic=entry[1], key=key)\n            elif link:\n                try:\n                    uri = builder.get_relative_uri('genindex', fn) + '#' + tid\n                except NoUri:\n                    pass\n                else:\n                    # maintain links in sorted/deterministic order\n                    bisect.insort(entry[0], (main, uri))"
      },
      {
        "file": "sphinx/environment/adapters/indexentries.py",
        "type": "function",
        "name": "add_entry",
        "class_name": "IndexEntries",
        "code": "def add_entry(word: str, subword: str, main: str, link: bool = True,\n                      dic: Dict = new, key: str = None) -> None:\n            # Force the word to be unicode if it's a ASCII bytestring.\n            # This will solve problems with unicode normalization later.\n            # For instance the RFC role will add bytestrings at the moment\n            word = str(word)\n            entry = dic.get(word)\n            if not entry:\n                dic[word] = entry = [[], {}, key]\n            if subword:\n                add_entry(subword, '', main, link=link, dic=entry[1], key=key)\n            elif link:\n                try:\n                    uri = builder.get_relative_uri('genindex', fn) + '#' + tid\n                except NoUri:\n                    pass\n                else:\n                    # maintain links in sorted/deterministic order\n                    bisect.insort(entry[0], (main, uri))"
      }
    ]
  },
  "Justification": "Candidate A is most helpful because it involves a bug related to the ordering of index entries, which is a similar structural issue to the problem of having two sections labeled \"Symbols\" in the CURRENT bug. Both involve manipulating how content is presented in the generated HTML output—a contextual relevance that aligns with the current bug's observable problem of duplicate section headers. Additionally, they both interact with the index management component of Sphinx's functionality, allowing insights into fixing structural errors in outputs that impact navigation. The potential to learn about content rendering mechanics from Candidate A provides a direct path toward addressing the CURRENT bug effectively.",
  "instance_id": "sphinx-doc__sphinx-7975",
  "repo": "sphinx-doc/sphinx",
  "created_at": "2020-07-18T06:39:32Z",
  "problem_statement": "Two sections called Symbols in index\nWhen using index entries with the following leading characters: _@_, _£_, and _←_ I get two sections called _Symbols_ in the HTML output, the first containing all _@_ entries before ”normal” words and the second containing _£_ and _←_ entries after the ”normal” words.  Both have the same anchor in HTML so the links at the top of the index page contain two _Symbols_ links, one before the letters and one after, but both lead to the first section.\n\n",
  "patch": "diff --git a/sphinx/environment/adapters/indexentries.py b/sphinx/environment/adapters/indexentries.py\n--- a/sphinx/environment/adapters/indexentries.py\n+++ b/sphinx/environment/adapters/indexentries.py\n@@ -98,9 +98,8 @@ def keyfunc0(entry: Tuple[str, str]) -> Tuple[bool, str]:\n             for subentry in indexentry[1].values():\n                 subentry[0].sort(key=keyfunc0)  # type: ignore\n \n-        # sort the index entries; put all symbols at the front, even those\n-        # following the letters in ASCII, this is where the chr(127) comes from\n-        def keyfunc(entry: Tuple[str, List]) -> Tuple[str, str]:\n+        # sort the index entries\n+        def keyfunc(entry: Tuple[str, List]) -> Tuple[Tuple[int, str], str]:\n             key, (void, void, category_key) = entry\n             if category_key:\n                 # using specified category key to sort\n@@ -108,11 +107,16 @@ def keyfunc(entry: Tuple[str, List]) -> Tuple[str, str]:\n             lckey = unicodedata.normalize('NFD', key.lower())\n             if lckey.startswith('\\N{RIGHT-TO-LEFT MARK}'):\n                 lckey = lckey[1:]\n+\n             if lckey[0:1].isalpha() or lckey.startswith('_'):\n-                lckey = chr(127) + lckey\n+                # put non-symbol characters at the folloing group (1)\n+                sortkey = (1, lckey)\n+            else:\n+                # put symbols at the front of the index (0)\n+                sortkey = (0, lckey)\n             # ensure a determinstic order *within* letters by also sorting on\n             # the entry itself\n-            return (lckey, entry[0])\n+            return (sortkey, entry[0])\n         newlist = sorted(new.items(), key=keyfunc)\n \n         if group_entries:\n"
}