{
  "Selected_candidate": {
    "pr_number": 11263,
    "pr_title": "Fixed #30361 -- Increased the default timeout of watchman client to 5 seconds and made it customizable.",
    "pr_body": "",
    "issue_id": 30361,
    "issue_title": "Watchman timing out when loading server",
    "issue_body": "When starting the server on my project using\n./manage.py runserver\n, I get the error message:\nError connecting to Watchman: timed out waiting for response, while executing ('watch-project', 'my_app')\nI am using Watchman v4.9 on an Ubuntu 16.04 Docker image hosted on Mac OS X 10.14.4.\nMy research shows that there is a default 1 second timeout in\npywatchman\nthat Django is using. In my tests, for our particular project it takes between 1 and 2 seconds to start the initial root watchman query, and thus will always time out when started with Django.\nMy suggestion is that we increase the pywatchman client timeout higher than 1 second",
    "issue_closed_at": "2019-04-26T06:35:55",
    "base_commit": "efeceba589974b95b35b2e25df86498c96315518",
    "changes": [
      {
        "file": "django/utils/autoreload.py",
        "type": "class",
        "name": "WatchmanReloader",
        "code": "class WatchmanReloader(BaseReloader):\n    def __init__(self):\n        self.roots = defaultdict(set)\n        self.processed_request = threading.Event()\n        super().__init__()\n\n    @cached_property\n    def client(self):\n        return pywatchman.client()\n\n    def _watch_root(self, root):\n        # In practice this shouldn't occur, however, it's possible that a\n        # directory that doesn't exist yet is being watched. If it's outside of\n        # sys.path then this will end up a new root. How to handle this isn't\n        # clear: Not adding the root will likely break when subscribing to the\n        # changes, however, as this is currently an internal API,  no files\n        # will be being watched outside of sys.path. Fixing this by checking\n        # inside watch_glob() and watch_dir() is expensive, instead this could\n        # could fall back to the StatReloader if this case is detected? For\n        # now, watching its parent, if possible, is sufficient.\n        if not root.exists():\n            if not root.parent.exists():\n                logger.warning('Unable to watch root dir %s as neither it or its parent exist.', root)\n                return\n            root = root.parent\n        result = self.client.query('watch-project', str(root.absolute()))\n        if 'warning' in result:\n            logger.warning('Watchman warning: %s', result['warning'])\n        logger.debug('Watchman watch-project result: %s', result)\n        return result['watch'], result.get('relative_path')\n\n    @functools.lru_cache()\n    def _get_clock(self, root):\n        return self.client.query('clock', root)['clock']\n\n    def _subscribe(self, directory, name, expression):\n        root, rel_path = self._watch_root(directory)\n        query = {\n            'expression': expression,\n            'fields': ['name'],\n            'since': self._get_clock(root),\n            'dedup_results': True,\n        }\n        if rel_path:\n            query['relative_root'] = rel_path\n        logger.debug('Issuing watchman subscription %s, for root %s. Query: %s', name, root, query)\n        self.client.query('subscribe', root, name, query)\n\n    def _subscribe_dir(self, directory, filenames):\n        if not directory.exists():\n            if not directory.parent.exists():\n                logger.warning('Unable to watch directory %s as neither it or its parent exist.', directory)\n                return\n            prefix = 'files-parent-%s' % directory.name\n            filenames = ['%s/%s' % (directory.name, filename) for filename in filenames]\n            directory = directory.parent\n            expression = ['name', filenames, 'wholename']\n        else:\n            prefix = 'files'\n            expression = ['name', filenames]\n        self._subscribe(directory, '%s:%s' % (prefix, directory), expression)\n\n    def _watch_glob(self, directory, patterns):\n        \"\"\"\n        Watch a directory with a specific glob. If the directory doesn't yet\n        exist, attempt to watch the parent directory and amend the patterns to\n        include this. It's important this method isn't called more than one per\n        directory when updating all subscriptions. Subsequent calls will\n        overwrite the named subscription, so it must include all possible glob\n        expressions.\n        \"\"\"\n        prefix = 'glob'\n        if not directory.exists():\n            if not directory.parent.exists():\n                logger.warning('Unable to watch directory %s as neither it or its parent exist.', directory)\n                return\n            prefix = 'glob-parent-%s' % directory.name\n            patterns = ['%s/%s' % (directory.name, pattern) for pattern in patterns]\n            directory = directory.parent\n\n        expression = ['anyof']\n        for pattern in patterns:\n            expression.append(['match', pattern, 'wholename'])\n        self._subscribe(directory, '%s:%s' % (prefix, directory), expression)\n\n    def watched_roots(self, watched_files):\n        extra_directories = self.directory_globs.keys()\n        watched_file_dirs = [f.parent for f in watched_files]\n        sys_paths = list(sys_path_directories())\n        return frozenset((*extra_directories, *watched_file_dirs, *sys_paths))\n\n    def _update_watches(self):\n        watched_files = list(self.watched_files(include_globs=False))\n        found_roots = common_roots(self.watched_roots(watched_files))\n        logger.debug('Watching %s files', len(watched_files))\n        logger.debug('Found common roots: %s', found_roots)\n        # Setup initial roots for performance, shortest roots first.\n        for root in sorted(found_roots):\n            self._watch_root(root)\n        for directory, patterns in self.directory_globs.items():\n            self._watch_glob(directory, patterns)\n        # Group sorted watched_files by their parent directory.\n        sorted_files = sorted(watched_files, key=lambda p: p.parent)\n        for directory, group in itertools.groupby(sorted_files, key=lambda p: p.parent):\n            # These paths need to be relative to the parent directory.\n            self._subscribe_dir(directory, [str(p.relative_to(directory)) for p in group])\n\n    def update_watches(self):\n        try:\n            self._update_watches()\n        except Exception as ex:\n            # If the service is still available, raise the original exception.\n            if self.check_server_status(ex):\n                raise\n\n    def _check_subscription(self, sub):\n        subscription = self.client.getSubscription(sub)\n        if not subscription:\n            return\n        logger.debug('Watchman subscription %s has results.', sub)\n        for result in subscription:\n            # When using watch-project, it's not simple to get the relative\n            # directory without storing some specific state. Store the full\n            # path to the directory in the subscription name, prefixed by its\n            # type (glob, files).\n            root_directory = Path(result['subscription'].split(':', 1)[1])\n            logger.debug('Found root directory %s', root_directory)\n            for file in result.get('files', []):\n                self.notify_file_changed(root_directory / file)\n\n    def request_processed(self, **kwargs):\n        logger.debug('Request processed. Setting update_watches event.')\n        self.processed_request.set()\n\n    def tick(self):\n        request_finished.connect(self.request_processed)\n        self.update_watches()\n        while True:\n            if self.processed_request.is_set():\n                self.update_watches()\n                self.processed_request.clear()\n            try:\n                self.client.receive()\n            except pywatchman.WatchmanError as ex:\n                self.check_server_status(ex)\n            else:\n                for sub in list(self.client.subs.keys()):\n                    self._check_subscription(sub)\n            yield\n\n    def stop(self):\n        self.client.close()\n        super().stop()\n\n    def check_server_status(self, inner_ex=None):\n        \"\"\"Return True if the server is available.\"\"\"\n        try:\n            self.client.query('version')\n        except Exception:\n            raise WatchmanUnavailable(str(inner_ex)) from inner_ex\n        return True\n\n    @classmethod\n    def check_availability(cls):\n        if not pywatchman:\n            raise WatchmanUnavailable('pywatchman not installed.')\n        client = pywatchman.client(timeout=0.01)\n        try:\n            result = client.capabilityCheck()\n        except Exception:\n            # The service is down?\n            raise WatchmanUnavailable('Cannot connect to the watchman service.')\n        version = get_version_tuple(result['version'])\n        # Watchman 4.9 includes multiple improvements to watching project\n        # directories as well as case insensitive filesystems.\n        logger.debug('Watchman version %s', version)\n        if version < (4, 9):\n            raise WatchmanUnavailable('Watchman 4.9 or later is required.')"
      },
      {
        "file": "django/utils/autoreload.py",
        "type": "function",
        "name": "check_server_status",
        "class_name": "WatchmanReloader",
        "code": "def check_server_status(self, inner_ex=None):\n        \"\"\"Return True if the server is available.\"\"\"\n        try:\n            self.client.query('version')\n        except Exception:\n            raise WatchmanUnavailable(str(inner_ex)) from inner_ex\n        return True"
      }
    ]
  },
  "Justification": "Candidate E is the most relevant to the CURRENT bug report because it directly relates to the autoreloading functionality of Django when running a server with manage.py. The problem described in Candidate E involves a timeout issue with the watchman, which is a similar mechanism that relates to file tracking and changes, paralleling the CURRENT bug's issue of changes in manage.py not being detected. The changes made to the watchman timeout address a fundamental aspect of the autoreload process, potentially providing insights or analogs helpful in diagnosing why changes are not triggering the expected reload behavior. Moreover, both bugs involve Django's management command execution, making Candidate E particularly pertinent.",
  "instance_id": "django__django-11422",
  "repo": "django/django",
  "created_at": "2019-05-27T19:15:21Z",
  "problem_statement": "Autoreloader with StatReloader doesn't track changes in manage.py.\nDescription\n\t \n\t\t(last modified by Mariusz Felisiak)\n\t \nThis is a bit convoluted, but here we go.\nEnvironment (OSX 10.11):\n$ python -V\nPython 3.6.2\n$ pip -V\npip 19.1.1\n$ pip install Django==2.2.1\nSteps to reproduce:\nRun a server python manage.py runserver\nEdit the manage.py file, e.g. add print(): \ndef main():\n\tprint('sth')\n\tos.environ.setdefault('DJANGO_SETTINGS_MODULE', 'ticket_30479.settings')\n\t...\nUnder 2.1.8 (and prior), this will trigger the auto-reloading mechanism. Under 2.2.1, it won't. As far as I can tell from the django.utils.autoreload log lines, it never sees the manage.py itself.\n",
  "patch": "diff --git a/django/utils/autoreload.py b/django/utils/autoreload.py\n--- a/django/utils/autoreload.py\n+++ b/django/utils/autoreload.py\n@@ -114,7 +114,15 @@ def iter_modules_and_files(modules, extra_files):\n         # During debugging (with PyDev) the 'typing.io' and 'typing.re' objects\n         # are added to sys.modules, however they are types not modules and so\n         # cause issues here.\n-        if not isinstance(module, ModuleType) or getattr(module, '__spec__', None) is None:\n+        if not isinstance(module, ModuleType):\n+            continue\n+        if module.__name__ == '__main__':\n+            # __main__ (usually manage.py) doesn't always have a __spec__ set.\n+            # Handle this by falling back to using __file__, resolved below.\n+            # See https://docs.python.org/reference/import.html#main-spec\n+            sys_file_paths.append(module.__file__)\n+            continue\n+        if getattr(module, '__spec__', None) is None:\n             continue\n         spec = module.__spec__\n         # Modules could be loaded from places without a concrete location. If\n"
}