{
  "instance_id": "mwaskom__seaborn-3190",
  "repo": "mwaskom/seaborn",
  "created_at": "2022-12-18T17:13:51Z",
  "problem_statement": "Color mapping fails with boolean data\n```python\r\nso.Plot([\"a\", \"b\"], [1, 2], color=[True, False]).add(so.Bar())\r\n```\r\n```python-traceback\r\n---------------------------------------------------------------------------\r\nTypeError                                 Traceback (most recent call last)\r\n...\r\nFile ~/code/seaborn/seaborn/_core/plot.py:841, in Plot._plot(self, pyplot)\r\n    838 plotter._compute_stats(self, layers)\r\n    840 # Process scale spec for semantic variables and coordinates computed by stat\r\n--> 841 plotter._setup_scales(self, common, layers)\r\n    843 # TODO Remove these after updating other methods\r\n    844 # ---- Maybe have debug= param that attaches these when True?\r\n    845 plotter._data = common\r\n\r\nFile ~/code/seaborn/seaborn/_core/plot.py:1252, in Plotter._setup_scales(self, p, common, layers, variables)\r\n   1250     self._scales[var] = Scale._identity()\r\n   1251 else:\r\n-> 1252     self._scales[var] = scale._setup(var_df[var], prop)\r\n   1254 # Everything below here applies only to coordinate variables\r\n   1255 # We additionally skip it when we're working with a value\r\n   1256 # that is derived from a coordinate we've already processed.\r\n   1257 # e.g., the Stat consumed y and added ymin/ymax. In that case,\r\n   1258 # we've already setup the y scale and ymin/max are in scale space.\r\n   1259 if axis is None or (var != coord and coord in p._variables):\r\n\r\nFile ~/code/seaborn/seaborn/_core/scales.py:351, in ContinuousBase._setup(self, data, prop, axis)\r\n    349 vmin, vmax = axis.convert_units((vmin, vmax))\r\n    350 a = forward(vmin)\r\n--> 351 b = forward(vmax) - forward(vmin)\r\n    353 def normalize(x):\r\n    354     return (x - a) / b\r\n\r\nTypeError: numpy boolean subtract, the `-` operator, is not supported, use the bitwise_xor, the `^` operator, or the logical_xor function instead.\r\n```\n",
  "patch": "diff --git a/seaborn/_core/scales.py b/seaborn/_core/scales.py\n--- a/seaborn/_core/scales.py\n+++ b/seaborn/_core/scales.py\n@@ -346,7 +346,7 @@ def _setup(\n                 vmin, vmax = data.min(), data.max()\n             else:\n                 vmin, vmax = new.norm\n-            vmin, vmax = axis.convert_units((vmin, vmax))\n+            vmin, vmax = map(float, axis.convert_units((vmin, vmax)))\n             a = forward(vmin)\n             b = forward(vmax) - forward(vmin)\n \n",
  "similar_bug_items": [
    {
      "pr_number": 2468,
      "pr_title": "Fix faceted bivariate histogram normalization at displot",
      "pr_body": "Fixes #2465",
      "issue_id": 2465,
      "issue_title": "bivariate displot with kind=\"hist\" ignores common_norm=False if hue is not assigned",
      "issue_body": "Somehow similar to #2377, but for `kind='hist'` and with `common_norm=False` being ignored.\r\n\r\nIf I understand it well, passing `common_norm=False` to `sns.distplot` should produce plots with independent \"z\" scale. While this is the behaviour for kde plots, it seems to be ignored for bivariate histograms unless hue is also specified.\r\n\r\nTest case:\r\n```python\r\nx, y = np.random.randn(2, 200)\r\nz = [0] * 150 + [1] * 50\r\nsns.displot(x=x, y=y, col=z, kind=\"hist\", cbar=True, common_norm=False)\r\nsns.displot(x=x, y=y, col=z, hue=z, kind=\"hist\", cbar=True, common_norm=False)\r\n```\r\n\r\nRunning seaborn version 0.11.1\r\n(I tried to look for other (open or closed) related issues, hope not duplicating them)",
      "issue_closed_at": "2021-02-05T01:20:16Z",
      "base_commit": "beb7f822895375143de396659cb562465ade25d7",
      "changes": [
        {
          "file": "seaborn/distributions.py",
          "type": "function",
          "name": "plot_bivariate_histogram",
          "class_name": "_DistributionPlotter",
          "code": "def plot_bivariate_histogram(\n        self,\n        common_bins, common_norm,\n        thresh, pthresh, pmax,\n        color, legend,\n        cbar, cbar_ax, cbar_kws,\n        estimate_kws,\n        **plot_kws,\n    ):\n\n        # Default keyword dicts\n        cbar_kws = {} if cbar_kws is None else cbar_kws.copy()\n\n        # Now initialize the Histogram estimator\n        estimator = Histogram(**estimate_kws)\n\n        # Do pre-compute housekeeping related to multiple groups\n        if set(self.variables) - {\"x\", \"y\"}:\n            all_data = self.comp_data.dropna()\n            if common_bins:\n                estimator.define_bin_edges(\n                    all_data[\"x\"],\n                    all_data[\"y\"],\n                    all_data.get(\"weights\", None),\n                )\n        else:\n            common_norm = False\n\n        # -- Determine colormap threshold and norm based on the full data\n\n        full_heights = []\n        for _, sub_data in self.iter_data(from_comp_data=True):\n            sub_heights, _ = estimator(\n                sub_data[\"x\"], sub_data[\"y\"], sub_data.get(\"weights\", None)\n            )\n            full_heights.append(sub_heights)\n\n        common_color_norm = \"hue\" not in self.variables or common_norm\n\n        if pthresh is not None and common_color_norm:\n            thresh = self._quantile_to_level(full_heights, pthresh)\n\n        plot_kws.setdefault(\"vmin\", 0)\n        if common_color_norm:\n            if pmax is not None:\n                vmax = self._quantile_to_level(full_heights, pmax)\n            else:\n                vmax = plot_kws.pop(\"vmax\", np.max(full_heights))\n        else:\n            vmax = None\n\n        # Get a default color\n        # (We won't follow the color cycle here, as multiple plots are unlikely)\n        if color is None:\n            color = \"C0\"\n\n        # --- Loop over data (subsets) and draw the histograms\n        for sub_vars, sub_data in self.iter_data(\"hue\", from_comp_data=True):\n\n            if sub_data.empty:\n                continue\n\n            # Do the histogram computation\n            heights, (x_edges, y_edges) = estimator(\n                sub_data[\"x\"],\n                sub_data[\"y\"],\n                weights=sub_data.get(\"weights\", None),\n            )\n\n            # Check for log scaling on the data axis\n            if self._log_scaled(\"x\"):\n                x_edges = np.power(10, x_edges)\n            if self._log_scaled(\"y\"):\n                y_edges = np.power(10, y_edges)\n\n            # Apply scaling to normalize across groups\n            if estimator.stat != \"count\" and common_norm:\n                heights *= len(sub_data) / len(all_data)\n\n            # Define the specific kwargs for this artist\n            artist_kws = plot_kws.copy()\n            if \"hue\" in self.variables:\n                color = self._hue_map(sub_vars[\"hue\"])\n                cmap = self._cmap_from_color(color)\n                artist_kws[\"cmap\"] = cmap\n            else:\n                cmap = artist_kws.pop(\"cmap\", None)\n                if isinstance(cmap, str):\n                    cmap = color_palette(cmap, as_cmap=True)\n                elif cmap is None:\n                    cmap = self._cmap_from_color(color)\n                artist_kws[\"cmap\"] = cmap\n\n            # Set the upper norm on the colormap\n            if not common_color_norm and pmax is not None:\n                vmax = self._quantile_to_level(heights, pmax)\n            if vmax is not None:\n                artist_kws[\"vmax\"] = vmax\n\n            # Make cells at or below the threshold transparent\n            if not common_color_norm and pthresh:\n                thresh = self._quantile_to_level(heights, pthresh)\n            if thresh is not None:\n                heights = np.ma.masked_less_equal(heights, thresh)\n\n            # Get the axes for this plot\n            ax = self._get_axes(sub_vars)\n\n            # pcolormesh is going to turn the grid off, but we want to keep it\n            # I'm not sure if there's a better way to get the grid state\n            x_grid = any([l.get_visible() for l in ax.xaxis.get_gridlines()])\n            y_grid = any([l.get_visible() for l in ax.yaxis.get_gridlines()])\n\n            mesh = ax.pcolormesh(\n                x_edges,\n                y_edges,\n                heights.T,\n                **artist_kws,\n            )\n\n            # pcolormesh sets sticky edges, but we only want them if not thresholding\n            if thresh is not None:\n                mesh.sticky_edges.x[:] = []\n                mesh.sticky_edges.y[:] = []\n\n            # Add an optional colorbar\n            # Note, we want to improve this. When hue is used, it will stack\n            # multiple colorbars with redundant ticks in an ugly way.\n            # But it's going to take some work to have multiple colorbars that\n            # share ticks nicely.\n            if cbar:\n                ax.figure.colorbar(mesh, cbar_ax, ax, **cbar_kws)\n\n            # Reset the grid state\n            if x_grid:\n                ax.grid(True, axis=\"x\")\n            if y_grid:\n                ax.grid(True, axis=\"y\")\n\n        # --- Finalize the plot\n\n        ax = self.ax if self.ax is not None else self.facets.axes.flat[0]\n        self._add_axis_labels(ax)\n\n        if \"hue\" in self.variables and legend:\n\n            # TODO if possible, I would like to move the contour\n            # intensity information into the legend too and label the\n            # iso proportions rather than the raw density values\n\n            artist_kws = {}\n            artist = partial(mpl.patches.Patch)\n            ax_obj = self.ax if self.ax is not None else self.facets\n            self._add_legend(\n                ax_obj, artist, True, False, \"layer\", 1, artist_kws, {},\n            )"
        }
      ]
    },
    {
      "pr_number": 2417,
      "pr_title": "Improve NA robustness in VectorPlotter.comp_data",
      "pr_body": "This PR avoids passing `nan` through the matplotlib converters used to obtain a numeric/computable representation of the data (i.e. `VectorPlotter.comp_data`).\r\n\r\nIt also\r\n- codifies that the converted columns in `comp_data` have a float dtype\r\n- converts `inf` to `nan`, in line with what matplotlib does\r\n\r\nFixes #2295 \r\n\r\nAdditionally this will implicitly address #1971 once the regression plots are refactored to use `comp_data` internally. (@mojones, funny that you opened both issues).",
      "issue_id": 2295,
      "issue_title": "histplot with categorical values crashes with missing data, though numerical values work fine",
      "issue_body": "Not sure if this is intended behaviour, but it caught me out due to the difference in handling numerical/categorical data. I note that drawing histograms of categorical data is labelled as experimental, so ignore/close if that explains it.\r\n\r\nWith numerical data `histplot` ignores NaN and plots the other values, this is the behaviour I would expect:\r\n\r\n```\r\nimport numpy as np\r\nimport seaborn as sns\r\n\r\nsns.histplot(\r\n    [1.1, 1.2, 1.3, 1.4, np.nan]\r\n)\r\n```\r\n\r\nbut with categorical data it crashes:\r\n```\r\nimport numpy as np\r\nimport seaborn as sns\r\n\r\nsns.histplot(\r\n    ['foo', 'foo', 'bar', np.nan]\r\n)\r\n\r\n# output\r\n---------------------------------------------------------------------------\r\nTypeError                                 Traceback (most recent call last)\r\n~/.virtualenvs/drawingfromdata/lib/python3.8/site-packages/matplotlib/axis.py in convert_units(self, x)\r\n   1519         try:\r\n-> 1520             ret = self.converter.convert(x, self.units, self)\r\n   1521         except Exception as e:\r\n\r\n~/.virtualenvs/drawingfromdata/lib/python3.8/site-packages/matplotlib/category.py in convert(value, unit, axis)\r\n     60         # force an update so it also does type checking\r\n---> 61         unit.update(values)\r\n     62         return np.vectorize(unit._mapping.__getitem__, otypes=[float])(values)\r\n\r\n~/.virtualenvs/drawingfromdata/lib/python3.8/site-packages/matplotlib/category.py in update(self, data)\r\n    210             # OrderedDict just iterates over unique values in data.\r\n--> 211             cbook._check_isinstance((str, bytes), value=val)\r\n    212             if convertible:\r\n\r\n~/.virtualenvs/drawingfromdata/lib/python3.8/site-packages/matplotlib/cbook/__init__.py in _check_isinstance(_types, **kwargs)\r\n   2234         if not isinstance(v, types):\r\n-> 2235             raise TypeError(\r\n   2236                 \"{!r} must be an instance of {}, not a {}\".format(\r\n\r\nTypeError: 'value' must be an instance of str or bytes, not a float\r\n\r\nThe above exception was the direct cause of the following exception:\r\n\r\nConversionError                           Traceback (most recent call last)\r\n<ipython-input-61-b132ea7dca6c> in <module>\r\n      2 import seaborn as sns\r\n      3 \r\n----> 4 sns.histplot(\r\n      5     ['foo', 'foo', 'bar', np.nan]\r\n      6 )\r\n\r\n~/.virtualenvs/drawingfromdata/lib/python3.8/site-packages/seaborn/distributions.py in histplot(data, x, y, hue, weights, stat, bins, binwidth, binrange, discrete, cumulative, common_bins, common_norm, multiple, element, fill, shrink, kde, kde_kws, line_kws, thresh, pthresh, pmax, cbar, cbar_ax, cbar_kws, palette, hue_order, hue_norm, color, log_scale, legend, ax, **kwargs)\r\n   1420     if p.univariate:\r\n   1421 \r\n-> 1422         p.plot_univariate_histogram(\r\n   1423             multiple=multiple,\r\n   1424             element=element,\r\n\r\n~/.virtualenvs/drawingfromdata/lib/python3.8/site-packages/seaborn/distributions.py in plot_univariate_histogram(self, multiple, element, fill, common_norm, common_bins, shrink, kde, kde_kws, color, legend, line_kws, estimate_kws, **plot_kws)\r\n    421 \r\n    422         # First pass through the data to compute the histograms\r\n--> 423         for sub_vars, sub_data in self.iter_data(\"hue\", from_comp_data=True):\r\n    424 \r\n    425             # Prepare the relevant data\r\n\r\n~/.virtualenvs/drawingfromdata/lib/python3.8/site-packages/seaborn/_core.py in iter_data(self, grouping_vars, reverse, from_comp_data)\r\n    965 \r\n    966         if from_comp_data:\r\n--> 967             data = self.comp_data\r\n    968         else:\r\n    969             data = self.plot_data\r\n\r\n~/.virtualenvs/drawingfromdata/lib/python3.8/site-packages/seaborn/_core.py in comp_data(self)\r\n   1034                 axis = getattr(ax, f\"{var}axis\")\r\n   1035 \r\n-> 1036                 comp_var = axis.convert_units(self.plot_data[var])\r\n   1037                 if axis.get_scale() == \"log\":\r\n   1038                     comp_var = np.log10(comp_var)\r\n\r\n~/.virtualenvs/drawingfromdata/lib/python3.8/site-packages/matplotlib/axis.py in convert_units(self, x)\r\n   1520             ret = self.converter.convert(x, self.units, self)\r\n   1521         except Exception as e:\r\n-> 1522             raise munits.ConversionError('Failed to convert value(s) to axis '\r\n   1523                                          f'units: {x!r}') from e\r\n   1524         return ret\r\n\r\nConversionError: Failed to convert value(s) to axis units: 0    foo\r\n1    foo\r\n2    bar\r\n3    NaN\r\nName: x, dtype: object\r\n```\r\n\r\n",
      "issue_closed_at": "2021-01-05T19:40:57Z",
      "base_commit": "aad96f8d2e36ceceb82a42b69aa3a8f47ef7210d",
      "changes": [
        {
          "file": "seaborn/_core.py",
          "type": "function",
          "name": "comp_data",
          "class_name": "VectorPlotter",
          "code": "def comp_data(self):\n        \"\"\"Dataframe with numeric x and y, after unit conversion and log scaling.\"\"\"\n        if not hasattr(self, \"ax\"):\n            # Probably a good idea, but will need a bunch of tests updated\n            # Most of these tests should just use the external interface\n            # Then this can be re-enabled.\n            # raise AttributeError(\"No Axes attached to plotter\")\n            return self.plot_data\n\n        if not hasattr(self, \"_comp_data\"):\n\n            comp_data = (\n                self.plot_data\n                .copy(deep=False)\n                .drop([\"x\", \"y\"], axis=1, errors=\"ignore\")\n            )\n            for var in \"yx\":\n                if var not in self.variables:\n                    continue\n\n                # Get a corresponding axis object so that we can convert the units\n                # to matplotlib's numeric representation, which we can compute on\n                # This is messy and it would probably be better for VectorPlotter\n                # to manage its own converters (using the matplotlib tools).\n                # XXX Currently does not support unshared categorical axes!\n                # (But see comment in _attach about how those don't exist)\n                if self.ax is None:\n                    ax = self.facets.axes.flat[0]\n                else:\n                    ax = self.ax\n                axis = getattr(ax, f\"{var}axis\")\n\n                comp_var = axis.convert_units(self.plot_data[var])\n                if axis.get_scale() == \"log\":\n                    comp_var = np.log10(comp_var)\n                comp_data.insert(0, var, comp_var)\n\n            self._comp_data = comp_data\n\n        return self._comp_data"
        }
      ]
    },
    {
      "pr_number": 3065,
      "pr_title": "Fix unfilled kdeplot cmap regression",
      "pr_body": "Fixes #3058\r\n\r\n```python\r\ngeyser = sns.load_dataset(\"geyser\")\r\nsns.kdeplot(geyser, x=\"waiting\", y=\"duration\", cmap=\"viridis\")\r\n```\r\n\r\n![image](https://user-images.githubusercontent.com/315810/194729481-110b8da9-7a97-4109-9063-a9d47c74dd5d.png)\r\n",
      "issue_id": 3058,
      "issue_title": "unable to plot with custom color ramp seaborn 0.12.0",
      "issue_body": "I was trying to use seaborn kdeplot with custom colour ramp, it is working with seaboarn version 0.11.00, but not with seaboarn 0.12.0\r\n\r\n**color ramp as below** \r\n```\r\ndef make_Ramp( ramp_colors ): \r\n    from colour import Color\r\n    from matplotlib.colors import LinearSegmentedColormap\r\n\r\n    color_ramp = LinearSegmentedColormap.from_list( 'my_list', [ Color( c1 ).rgb for c1 in ramp_colors ] )\r\n    plt.figure( figsize = (15,3))\r\n    plt.imshow( [list(np.arange(0, len( ramp_colors ) , 0.1)) ] , interpolation='nearest', origin='lower', cmap= color_ramp )\r\n    plt.xticks([])\r\n    plt.yticks([])\r\n    return color_ramp\r\n\r\ncustom_ramp = make_Ramp( ['#0000ff','#00ffff','#ffff00','#ff0000' ] ) \r\n```\r\n\r\nmy data look like this\r\n```\r\n\r\n            0        1         2\r\n0    142.5705  38.5744  hairpins\r\n1    281.0795  55.1900  hairpins\r\n2    101.7282  49.5604  hairpins\r\n3     59.8472  63.0699  hairpins\r\n4    296.4381  44.8293  hairpins\r\n..        ...      ...       ...\r\n347  284.6841  51.7468     stems\r\n348  288.7241  49.9322     stems\r\n349  320.2972  41.5520     stems\r\n350  302.6805  67.2658     stems\r\n351  293.6837  52.0663     stems\r\n\r\n[352 rows x 3 columns]\r\n<class 'numpy.float64'>\r\n```\r\n\r\n**this is my code**\r\n\r\n`ax = sns.kdeplot(data=df, x=df.loc[df[2] == \"hairpins\", 0], y=df.loc[df[2] == \"hairpins\", 1], fill=False, thresh=0, levels=20, cmap=custom_ramp, common_norm=True, cbar=True, )`\r\n\r\n**with version 0.12.0 get this error**\r\n\r\n```\r\n\r\n---------------------------------------------------------------------------\r\nAttributeError                            Traceback (most recent call last)\r\n[<ipython-input-6-88652c0ba7ce>](https://localhost:8080/#) in <module>\r\n     21   #/\r\n     22     plt.subplot(2,3,i+1)\r\n---> 23     ax = sns.kdeplot(data=df, x=df.loc[df[2] == dimtypes[i], 0], y=df.loc[df[2] == dimtypes[i], 1], fill=False, thresh=0, levels=20, cmap=custom_ramp, common_norm=True, cbar=True, cbar_kws={'format': '%2.1e', 'label': 'kernel density'} )\r\n     24     plt.title(\"Chart {}: {}\".format(i+1, dimtypes[i]), size=20)\r\n     25     plt.xlabel(str(xname), fontsize=12)\r\n\r\n9 frames\r\n[/usr/local/lib/python3.7/dist-packages/matplotlib/artist.py](https://localhost:8080/#) in update(self, props)\r\n   1065                     func = getattr(self, f\"set_{k}\", None)\r\n   1066                     if not callable(func):\r\n-> 1067                         raise AttributeError(f\"{type(self).__name__!r} object \"\r\n   1068                                              f\"has no property {k!r}\")\r\n   1069                     ret.append(func(v))\r\n\r\nAttributeError: 'Line2D' object has no property 'cmap'\r\n```\r\n\r\n**with version 0.11.0 get this plot**\r\n\r\n![image](https://user-images.githubusercontent.com/67545640/194606070-fc6a1d26-0d2d-48e9-b371-eff69c69b4b6.png)\r\n\r\nbasically, custom ramp is not woking with seaborn 0.12.0 , please update thanks\r\n",
      "issue_closed_at": "2022-10-08T23:02:17Z",
      "base_commit": "c412ddf1fede5d8882a6c230826c1d8fbbf61911",
      "changes": [
        {
          "file": "seaborn/distributions.py",
          "type": "function",
          "name": "plot_bivariate_density",
          "class_name": "_DistributionPlotter",
          "code": "def plot_bivariate_density(\n        self,\n        common_norm,\n        fill,\n        levels,\n        thresh,\n        color,\n        legend,\n        cbar,\n        warn_singular,\n        cbar_ax,\n        cbar_kws,\n        estimate_kws,\n        **contour_kws,\n    ):\n\n        contour_kws = contour_kws.copy()\n\n        estimator = KDE(**estimate_kws)\n\n        if not set(self.variables) - {\"x\", \"y\"}:\n            common_norm = False\n\n        all_data = self.plot_data.dropna()\n\n        # Loop through the subsets and estimate the KDEs\n        densities, supports = {}, {}\n\n        for sub_vars, sub_data in self.iter_data(\"hue\", from_comp_data=True):\n\n            # Extract the data points from this sub set\n            observations = sub_data[[\"x\", \"y\"]]\n            min_variance = observations.var().fillna(0).min()\n            observations = observations[\"x\"], observations[\"y\"]\n\n            # Extract the weights for this subset of observations\n            if \"weights\" in self.variables:\n                weights = sub_data[\"weights\"]\n            else:\n                weights = None\n\n            # Estimate the density of observations at this level\n            singular = math.isclose(min_variance, 0)\n            try:\n                if not singular:\n                    density, support = estimator(*observations, weights=weights)\n            except np.linalg.LinAlgError:\n                # Testing for 0 variance doesn't catch all cases where scipy raises,\n                # but we can also get a ValueError, so we need this convoluted approach\n                singular = True\n\n            if singular:\n                msg = (\n                    \"KDE cannot be estimated (0 variance or perfect covariance). \"\n                    \"Pass `warn_singular=False` to disable this warning.\"\n                )\n                if warn_singular:\n                    warnings.warn(msg, UserWarning, stacklevel=3)\n                continue\n\n            # Transform the support grid back to the original scale\n            xx, yy = support\n            if self._log_scaled(\"x\"):\n                xx = np.power(10, xx)\n            if self._log_scaled(\"y\"):\n                yy = np.power(10, yy)\n            support = xx, yy\n\n            # Apply a scaling factor so that the integral over all subsets is 1\n            if common_norm:\n                density *= len(sub_data) / len(all_data)\n\n            key = tuple(sub_vars.items())\n            densities[key] = density\n            supports[key] = support\n\n        # Define a grid of iso-proportion levels\n        if thresh is None:\n            thresh = 0\n        if isinstance(levels, Number):\n            levels = np.linspace(thresh, 1, levels)\n        else:\n            if min(levels) < 0 or max(levels) > 1:\n                raise ValueError(\"levels must be in [0, 1]\")\n\n        # Transform from iso-proportions to iso-densities\n        if common_norm:\n            common_levels = self._quantile_to_level(\n                list(densities.values()), levels,\n            )\n            draw_levels = {k: common_levels for k in densities}\n        else:\n            draw_levels = {\n                k: self._quantile_to_level(d, levels)\n                for k, d in densities.items()\n            }\n\n        # Get a default single color from the attribute cycle\n        if self.ax is None:\n            default_color = \"C0\" if color is None else color\n        else:\n            scout, = self.ax.plot([], color=color)\n            default_color = scout.get_color()\n            scout.remove()\n\n        # Define the coloring of the contours\n        if \"hue\" in self.variables:\n            for param in [\"cmap\", \"colors\"]:\n                if param in contour_kws:\n                    msg = f\"{param} parameter ignored when using hue mapping.\"\n                    warnings.warn(msg, UserWarning)\n                    contour_kws.pop(param)\n        else:\n\n            # Work out a default coloring of the contours\n            coloring_given = set(contour_kws) & {\"cmap\", \"colors\"}\n            if fill and not coloring_given:\n                cmap = self._cmap_from_color(default_color)\n                contour_kws[\"cmap\"] = cmap\n            if not fill and not coloring_given:\n                contour_kws[\"colors\"] = [default_color]\n\n            # Use our internal colormap lookup\n            cmap = contour_kws.pop(\"cmap\", None)\n            if isinstance(cmap, str):\n                cmap = color_palette(cmap, as_cmap=True)\n            if cmap is not None:\n                contour_kws[\"cmap\"] = cmap\n\n        # Loop through the subsets again and plot the data\n        for sub_vars, _ in self.iter_data(\"hue\"):\n\n            if \"hue\" in sub_vars:\n                color = self._hue_map(sub_vars[\"hue\"])\n                if fill:\n                    contour_kws[\"cmap\"] = self._cmap_from_color(color)\n                else:\n                    contour_kws[\"colors\"] = [color]\n\n            ax = self._get_axes(sub_vars)\n\n            # Choose the function to plot with\n            # TODO could add a pcolormesh based option as well\n            # Which would look something like element=\"raster\"\n            if fill:\n                contour_func = ax.contourf\n            else:\n                contour_func = ax.contour\n\n            key = tuple(sub_vars.items())\n            if key not in densities:\n                continue\n            density = densities[key]\n            xx, yy = supports[key]\n\n            label = contour_kws.pop(\"label\", None)\n\n            cset = contour_func(\n                xx, yy, density,\n                levels=draw_levels[key],\n                **contour_kws,\n            )\n\n            if \"hue\" not in self.variables:\n                cset.collections[0].set_label(label)\n\n            # Add a color bar representing the contour heights\n            # Note: this shows iso densities, not iso proportions\n            # See more notes in histplot about how this could be improved\n            if cbar:\n                cbar_kws = {} if cbar_kws is None else cbar_kws\n                ax.figure.colorbar(cset, cbar_ax, ax, **cbar_kws)\n\n        # --- Finalize the plot\n        ax = self.ax if self.ax is not None else self.facets.axes.flat[0]\n        self._add_axis_labels(ax)\n\n        if \"hue\" in self.variables and legend:\n\n            # TODO if possible, I would like to move the contour\n            # intensity information into the legend too and label the\n            # iso proportions rather than the raw density values\n\n            artist_kws = {}\n            if fill:\n                artist = partial(mpl.patches.Patch)\n            else:\n                artist = partial(mpl.lines.Line2D, [], [])\n\n            ax_obj = self.ax if self.ax is not None else self.facets\n            self._add_legend(\n                ax_obj, artist, fill, False, \"layer\", 1, artist_kws, {},\n            )"
        },
        {
          "file": "seaborn/distributions.py",
          "type": "function",
          "name": "plot_bivariate_density",
          "class_name": "_DistributionPlotter",
          "code": "def plot_bivariate_density(\n        self,\n        common_norm,\n        fill,\n        levels,\n        thresh,\n        color,\n        legend,\n        cbar,\n        warn_singular,\n        cbar_ax,\n        cbar_kws,\n        estimate_kws,\n        **contour_kws,\n    ):\n\n        contour_kws = contour_kws.copy()\n\n        estimator = KDE(**estimate_kws)\n\n        if not set(self.variables) - {\"x\", \"y\"}:\n            common_norm = False\n\n        all_data = self.plot_data.dropna()\n\n        # Loop through the subsets and estimate the KDEs\n        densities, supports = {}, {}\n\n        for sub_vars, sub_data in self.iter_data(\"hue\", from_comp_data=True):\n\n            # Extract the data points from this sub set\n            observations = sub_data[[\"x\", \"y\"]]\n            min_variance = observations.var().fillna(0).min()\n            observations = observations[\"x\"], observations[\"y\"]\n\n            # Extract the weights for this subset of observations\n            if \"weights\" in self.variables:\n                weights = sub_data[\"weights\"]\n            else:\n                weights = None\n\n            # Estimate the density of observations at this level\n            singular = math.isclose(min_variance, 0)\n            try:\n                if not singular:\n                    density, support = estimator(*observations, weights=weights)\n            except np.linalg.LinAlgError:\n                # Testing for 0 variance doesn't catch all cases where scipy raises,\n                # but we can also get a ValueError, so we need this convoluted approach\n                singular = True\n\n            if singular:\n                msg = (\n                    \"KDE cannot be estimated (0 variance or perfect covariance). \"\n                    \"Pass `warn_singular=False` to disable this warning.\"\n                )\n                if warn_singular:\n                    warnings.warn(msg, UserWarning, stacklevel=3)\n                continue\n\n            # Transform the support grid back to the original scale\n            xx, yy = support\n            if self._log_scaled(\"x\"):\n                xx = np.power(10, xx)\n            if self._log_scaled(\"y\"):\n                yy = np.power(10, yy)\n            support = xx, yy\n\n            # Apply a scaling factor so that the integral over all subsets is 1\n            if common_norm:\n                density *= len(sub_data) / len(all_data)\n\n            key = tuple(sub_vars.items())\n            densities[key] = density\n            supports[key] = support\n\n        # Define a grid of iso-proportion levels\n        if thresh is None:\n            thresh = 0\n        if isinstance(levels, Number):\n            levels = np.linspace(thresh, 1, levels)\n        else:\n            if min(levels) < 0 or max(levels) > 1:\n                raise ValueError(\"levels must be in [0, 1]\")\n\n        # Transform from iso-proportions to iso-densities\n        if common_norm:\n            common_levels = self._quantile_to_level(\n                list(densities.values()), levels,\n            )\n            draw_levels = {k: common_levels for k in densities}\n        else:\n            draw_levels = {\n                k: self._quantile_to_level(d, levels)\n                for k, d in densities.items()\n            }\n\n        # Get a default single color from the attribute cycle\n        if self.ax is None:\n            default_color = \"C0\" if color is None else color\n        else:\n            scout, = self.ax.plot([], color=color)\n            default_color = scout.get_color()\n            scout.remove()\n\n        # Define the coloring of the contours\n        if \"hue\" in self.variables:\n            for param in [\"cmap\", \"colors\"]:\n                if param in contour_kws:\n                    msg = f\"{param} parameter ignored when using hue mapping.\"\n                    warnings.warn(msg, UserWarning)\n                    contour_kws.pop(param)\n        else:\n\n            # Work out a default coloring of the contours\n            coloring_given = set(contour_kws) & {\"cmap\", \"colors\"}\n            if fill and not coloring_given:\n                cmap = self._cmap_from_color(default_color)\n                contour_kws[\"cmap\"] = cmap\n            if not fill and not coloring_given:\n                contour_kws[\"colors\"] = [default_color]\n\n            # Use our internal colormap lookup\n            cmap = contour_kws.pop(\"cmap\", None)\n            if isinstance(cmap, str):\n                cmap = color_palette(cmap, as_cmap=True)\n            if cmap is not None:\n                contour_kws[\"cmap\"] = cmap\n\n        # Loop through the subsets again and plot the data\n        for sub_vars, _ in self.iter_data(\"hue\"):\n\n            if \"hue\" in sub_vars:\n                color = self._hue_map(sub_vars[\"hue\"])\n                if fill:\n                    contour_kws[\"cmap\"] = self._cmap_from_color(color)\n                else:\n                    contour_kws[\"colors\"] = [color]\n\n            ax = self._get_axes(sub_vars)\n\n            # Choose the function to plot with\n            # TODO could add a pcolormesh based option as well\n            # Which would look something like element=\"raster\"\n            if fill:\n                contour_func = ax.contourf\n            else:\n                contour_func = ax.contour\n\n            key = tuple(sub_vars.items())\n            if key not in densities:\n                continue\n            density = densities[key]\n            xx, yy = supports[key]\n\n            label = contour_kws.pop(\"label\", None)\n\n            cset = contour_func(\n                xx, yy, density,\n                levels=draw_levels[key],\n                **contour_kws,\n            )\n\n            if \"hue\" not in self.variables:\n                cset.collections[0].set_label(label)\n\n            # Add a color bar representing the contour heights\n            # Note: this shows iso densities, not iso proportions\n            # See more notes in histplot about how this could be improved\n            if cbar:\n                cbar_kws = {} if cbar_kws is None else cbar_kws\n                ax.figure.colorbar(cset, cbar_ax, ax, **cbar_kws)\n\n        # --- Finalize the plot\n        ax = self.ax if self.ax is not None else self.facets.axes.flat[0]\n        self._add_axis_labels(ax)\n\n        if \"hue\" in self.variables and legend:\n\n            # TODO if possible, I would like to move the contour\n            # intensity information into the legend too and label the\n            # iso proportions rather than the raw density values\n\n            artist_kws = {}\n            if fill:\n                artist = partial(mpl.patches.Patch)\n            else:\n                artist = partial(mpl.lines.Line2D, [], [])\n\n            ax_obj = self.ax if self.ax is not None else self.facets\n            self._add_legend(\n                ax_obj, artist, fill, False, \"layer\", 1, artist_kws, {},\n            )"
        },
        {
          "file": "seaborn/utils.py",
          "type": "function",
          "name": "_default_color",
          "class_name": null,
          "code": "def _default_color(method, hue, color, kws):\n    \"\"\"If needed, get a default color by using the matplotlib property cycle.\"\"\"\n    if hue is not None:\n        # This warning is probably user-friendly, but it's currently triggered\n        # in a FacetGrid context and I don't want to mess with that logic right now\n        #  if color is not None:\n        #      msg = \"`color` is ignored when `hue` is assigned.\"\n        #      warnings.warn(msg)\n        return None\n\n    if color is not None:\n        return color\n\n    elif method.__name__ == \"plot\":\n\n        scout, = method([], [], scalex=False, scaley=False, **kws)\n        color = scout.get_color()\n        scout.remove()\n\n    elif method.__name__ == \"scatter\":\n\n        # Matplotlib will raise if the size of x/y don't match s/c,\n        # and the latter might be in the kws dict\n        scout_size = max(\n            np.atleast_1d(kws.get(key, [])).shape[0]\n            for key in [\"s\", \"c\", \"fc\", \"facecolor\", \"facecolors\"]\n        )\n        scout_x = scout_y = np.full(scout_size, np.nan)\n\n        scout = method(scout_x, scout_y, **kws)\n        facecolors = scout.get_facecolors()\n\n        if not len(facecolors):\n            # Handle bug in matplotlib <= 3.2 (I think)\n            # This will limit the ability to use non color= kwargs to specify\n            # a color in versions of matplotlib with the bug, but trying to\n            # work out what the user wanted by re-implementing the broken logic\n            # of inspecting the kwargs is probably too brittle.\n            single_color = False\n        else:\n            single_color = np.unique(facecolors, axis=0).shape[0] == 1\n\n        # Allow the user to specify an array of colors through various kwargs\n        if \"c\" not in kws and single_color:\n            color = to_rgb(facecolors[0])\n\n        scout.remove()\n\n    elif method.__name__ == \"bar\":\n\n        # bar() needs masked, not empty data, to generate a patch\n        scout, = method([np.nan], [np.nan], **kws)\n        color = to_rgb(scout.get_facecolor())\n        scout.remove()\n\n    elif method.__name__ == \"fill_between\":\n\n        # There is a bug on matplotlib < 3.3 where fill_between with\n        # datetime units and empty data will set incorrect autoscale limits\n        # To workaround it, we'll always return the first color in the cycle.\n        # https://github.com/matplotlib/matplotlib/issues/17586\n        ax = method.__self__\n        datetime_axis = any([\n            isinstance(ax.xaxis.converter, mpl.dates.DateConverter),\n            isinstance(ax.yaxis.converter, mpl.dates.DateConverter),\n        ])\n        if Version(mpl.__version__) < Version(\"3.3\") and datetime_axis:\n            return \"C0\"\n\n        kws = _normalize_kwargs(kws, mpl.collections.PolyCollection)\n\n        scout = method([], [], **kws)\n        facecolor = scout.get_facecolor()\n        color = to_rgb(facecolor[0])\n        scout.remove()\n\n    return color"
        }
      ]
    },
    {
      "pr_number": 2979,
      "pr_title": "Fix visibility of internal axis labels with Plot.pair(wrap=...)",
      "pr_body": "\r\n1. Fix visibility of internal axis labels with `Plot.pair(wrap=...)`  (Closes #2976)\r\n\r\n```python\r\n(\r\n    so.Plot(mpg, y=\"mpg\")\r\n    .pair([\"displacement\", \"weight\", \"horsepower\", \"acceleration\"], wrap=2)\r\n    .add(so.Dots())\r\n)\r\n```\r\n![image](https://user-images.githubusercontent.com/315810/186991689-69c61e56-3054-49b3-ad87-7797198b1cd1.png)\r\n\r\n2. Fix (non-)sharing of axes for distinct variables with `Plot.pair(wrap=1)`\r\n\r\n```python\r\n(\r\n    so.Plot(mpg, x=\"mpg\")\r\n    .pair(y=[\"displacement\", \"weight\"], wrap=1)\r\n    .add(so.Dots())\r\n)\r\n```\r\n![image](https://user-images.githubusercontent.com/315810/186991550-5be28208-c5aa-4d47-b2c6-a36e0f1fe59b.png)\r\n",
      "issue_id": 2976,
      "issue_title": "Visibility of internal axis labels is wrong with wrapped pair plot",
      "issue_body": "```python\r\n(\r\n    so.Plot(mpg, y=\"mpg\")\r\n    .pair([\"displacement\", \"weight\", \"horsepower\", \"cylinders\"], wrap=2)\r\n)\r\n```\r\n![image](https://user-images.githubusercontent.com/315810/186793170-dedae71a-2cb9-4f0e-9339-07fc1d13ac59.png)\r\n\r\nThe top two subplots should have distinct x labels.",
      "issue_closed_at": "2022-08-27T00:31:23Z",
      "base_commit": "ebc4bfe9f8bf5c4ff10b14da8a49c8baa1ba76d0",
      "changes": [
        {
          "file": "seaborn/_core/plot.py",
          "type": "function",
          "name": "_setup_figure",
          "class_name": "Plotter",
          "code": "def _setup_figure(self, p: Plot, common: PlotData, layers: list[Layer]) -> None:\n\n        # --- Parsing the faceting/pairing parameterization to specify figure grid\n\n        subplot_spec = p._subplot_spec.copy()\n        facet_spec = p._facet_spec.copy()\n        pair_spec = p._pair_spec.copy()\n\n        for axis in \"xy\":\n            if axis in p._shares:\n                subplot_spec[f\"share{axis}\"] = p._shares[axis]\n\n        for dim in [\"col\", \"row\"]:\n            if dim in common.frame and dim not in facet_spec[\"structure\"]:\n                order = categorical_order(common.frame[dim])\n                facet_spec[\"structure\"][dim] = order\n\n        self._subplots = subplots = Subplots(subplot_spec, facet_spec, pair_spec)\n\n        # --- Figure initialization\n        self._figure = subplots.init_figure(\n            pair_spec, self._pyplot, p._figure_spec, p._target,\n        )\n\n        # --- Figure annotation\n        for sub in subplots:\n            ax = sub[\"ax\"]\n            for axis in \"xy\":\n                axis_key = sub[axis]\n\n                # ~~ Axis labels\n\n                # TODO Should we make it possible to use only one x/y label for\n                # all rows/columns in a faceted plot? Maybe using sub{axis}label,\n                # although the alignments of the labels from that method leaves\n                # something to be desired (in terms of how it defines 'centered').\n                names = [\n                    common.names.get(axis_key),\n                    *(layer[\"data\"].names.get(axis_key) for layer in layers)\n                ]\n                auto_label = next((name for name in names if name is not None), None)\n                label = self._resolve_label(p, axis_key, auto_label)\n                ax.set(**{f\"{axis}label\": label})\n\n                # ~~ Decoration visibility\n\n                # TODO there should be some override (in Plot.layout?) so that\n                # tick labels can be shown on interior shared axes\n                axis_obj = getattr(ax, f\"{axis}axis\")\n                visible_side = {\"x\": \"bottom\", \"y\": \"left\"}.get(axis)\n                show_axis_label = (\n                    sub[visible_side]\n                    or axis in p._pair_spec and bool(p._pair_spec.get(\"wrap\"))\n                    or not p._pair_spec.get(\"cross\", True)\n                )\n                axis_obj.get_label().set_visible(show_axis_label)\n                show_tick_labels = (\n                    show_axis_label\n                    or subplot_spec.get(f\"share{axis}\") not in (\n                        True, \"all\", {\"x\": \"col\", \"y\": \"row\"}[axis]\n                    )\n                )\n                for group in (\"major\", \"minor\"):\n                    for t in getattr(axis_obj, f\"get_{group}ticklabels\")():\n                        t.set_visible(show_tick_labels)\n\n            # TODO we want right-side titles for row facets in most cases?\n            # Let's have what we currently call \"margin titles\" but properly using the\n            # ax.set_title interface (see my gist)\n            title_parts = []\n            for dim in [\"col\", \"row\"]:\n                if sub[dim] is not None:\n                    val = self._resolve_label(p, \"title\", f\"{sub[dim]}\")\n                    if dim in p._labels:\n                        key = self._resolve_label(p, dim, common.names.get(dim))\n                        val = f\"{key} {val}\"\n                    title_parts.append(val)\n\n            has_col = sub[\"col\"] is not None\n            has_row = sub[\"row\"] is not None\n            show_title = (\n                has_col and has_row\n                or (has_col or has_row) and p._facet_spec.get(\"wrap\")\n                or (has_col and sub[\"top\"])\n                # TODO or has_row and sub[\"right\"] and <right titles>\n                or has_row  # TODO and not <right titles>\n            )\n            if title_parts:\n                title = \" | \".join(title_parts)\n                title_text = ax.set_title(title)\n                title_text.set_visible(show_title)\n            elif not (has_col or has_row):\n                title = self._resolve_label(p, \"title\", None)\n                title_text = ax.set_title(title)"
        },
        {
          "file": "seaborn/_core/plot.py",
          "type": "function",
          "name": "_setup_scales",
          "class_name": "Plotter",
          "code": "def _setup_scales(\n        self, p: Plot,\n        common: PlotData,\n        layers: list[Layer],\n        variables: list[str] | None = None,\n    ) -> None:\n\n        if variables is None:\n            # Add variables that have data but not a scale, which happens\n            # because this method can be called multiple time, to handle\n            # variables added during the Stat transform.\n            variables = []\n            for layer in layers:\n                variables.extend(layer[\"data\"].frame.columns)\n                for df in layer[\"data\"].frames.values():\n                    variables.extend(v for v in df if v not in variables)\n            variables = [v for v in variables if v not in self._scales]\n\n        for var in variables:\n\n            # Determine whether this is a coordinate variable\n            # (i.e., x/y, paired x/y, or derivative such as xmax)\n            m = re.match(r\"^(?P<coord>(?P<axis>x|y)\\d*).*\", var)\n            if m is None:\n                coord = axis = None\n            else:\n                coord = m[\"coord\"]\n                axis = m[\"axis\"]\n\n            # Get keys that handle things like x0, xmax, properly where relevant\n            prop_key = var if axis is None else axis\n            scale_key = var if coord is None else coord\n\n            if prop_key not in PROPERTIES:\n                continue\n\n            # Concatenate layers, using only the relevant coordinate and faceting vars,\n            # This is unnecessarily wasteful, as layer data will often be redundant.\n            # But figuring out the minimal amount we need is more complicated.\n            cols = [var, \"col\", \"row\"]\n            parts = [common.frame.filter(cols)]\n            for layer in layers:\n                parts.append(layer[\"data\"].frame.filter(cols))\n                for df in layer[\"data\"].frames.values():\n                    parts.append(df.filter(cols))\n            var_df = pd.concat(parts, ignore_index=True)\n\n            prop = PROPERTIES[prop_key]\n            scale = self._get_scale(p, scale_key, prop, var_df[var])\n\n            if scale_key not in p._variables:\n                # TODO this implies that the variable was added by the stat\n                # It allows downstream orientation inference to work properly.\n                # But it feels rather hacky, so ideally revisit.\n                scale._priority = 0  # type: ignore\n\n            if axis is None:\n                # We could think about having a broader concept of (un)shared properties\n                # In general, not something you want to do (different scales in facets)\n                # But could make sense e.g. with paired plots. Build later.\n                share_state = None\n                subplots = []\n            else:\n                share_state = self._subplots.subplot_spec[f\"share{axis}\"]\n                subplots = [view for view in self._subplots if view[axis] == coord]\n\n            # Shared categorical axes are broken on matplotlib<3.4.0.\n            # https://github.com/matplotlib/matplotlib/pull/18308\n            # This only affects us when sharing *paired* axes. This is a novel/niche\n            # behavior, so we will raise rather than hack together a workaround.\n            if axis is not None and Version(mpl.__version__) < Version(\"3.4.0\"):\n                from seaborn._core.scales import Nominal\n                paired_axis = axis in p._pair_spec\n                cat_scale = isinstance(scale, Nominal)\n                ok_dim = {\"x\": \"col\", \"y\": \"row\"}[axis]\n                shared_axes = share_state not in [False, \"none\", ok_dim]\n                if paired_axis and cat_scale and shared_axes:\n                    err = \"Sharing paired categorical axes requires matplotlib>=3.4.0\"\n                    raise RuntimeError(err)\n\n            if scale is None:\n                self._scales[var] = Scale._identity()\n            else:\n                self._scales[var] = scale._setup(var_df[var], prop)\n\n            # Everything below here applies only to coordinate variables\n            # We additionally skip it when we're working with a value\n            # that is derived from a coordinate we've already processed.\n            # e.g., the Stat consumed y and added ymin/ymax. In that case,\n            # we've already setup the y scale and ymin/max are in scale space.\n            if axis is None or (var != coord and coord in p._variables):\n                continue\n\n            # Set up an empty series to receive the transformed values.\n            # We need this to handle piecemeal transforms of categories -> floats.\n            transformed_data = []\n            for layer in layers:\n                index = layer[\"data\"].frame.index\n                empty_series = pd.Series(dtype=float, index=index, name=var)\n                transformed_data.append(empty_series)\n\n            for view in subplots:\n\n                axis_obj = getattr(view[\"ax\"], f\"{axis}axis\")\n                seed_values = self._get_subplot_data(var_df, var, view, share_state)\n                view_scale = scale._setup(seed_values, prop, axis=axis_obj)\n                set_scale_obj(view[\"ax\"], axis, view_scale._matplotlib_scale)\n\n                for layer, new_series in zip(layers, transformed_data):\n                    layer_df = layer[\"data\"].frame\n                    if var in layer_df:\n                        idx = self._get_subplot_index(layer_df, view)\n                        new_series.loc[idx] = view_scale(layer_df.loc[idx, var])\n\n            # Now the transformed data series are complete, set update the layer data\n            for layer, new_series in zip(layers, transformed_data):\n                layer_df = layer[\"data\"].frame\n                if var in layer_df:\n                    layer_df[var] = new_series"
        },
        {
          "file": "seaborn/_core/subplots.py",
          "type": "function",
          "name": "_determine_axis_sharing",
          "class_name": "Subplots",
          "code": "def _determine_axis_sharing(self, pair_spec: PairSpec) -> None:\n        \"\"\"Update subplot spec with default or specified axis sharing parameters.\"\"\"\n        axis_to_dim = {\"x\": \"col\", \"y\": \"row\"}\n        key: str\n        val: str | bool\n        for axis in \"xy\":\n            key = f\"share{axis}\"\n            # Always use user-specified value, if present\n            if key not in self.subplot_spec:\n                if axis in pair_spec.get(\"structure\", {}):\n                    # Paired axes are shared along one dimension by default\n                    if self.wrap in [None, 1] and pair_spec.get(\"cross\", True):\n                        val = axis_to_dim[axis]\n                    else:\n                        val = False\n                else:\n                    # This will pick up faceted plots, as well as single subplot\n                    # figures, where the value doesn't really matter\n                    val = True\n                self.subplot_spec[key] = val"
        }
      ]
    },
    {
      "pr_number": 2379,
      "pr_title": "FIX: Infer categorical dtypes before boolean resolution",
      "pr_body": "Fixes #2317, with small changes to the docstring of `variable_type`.",
      "issue_id": 2317,
      "issue_title": "Categorical variable with numerical classes incorrectly plotted only on y axis",
      "issue_body": "Dear All,\r\n\r\n\r\nI think I may have found a bug in Seaborn categorical plotting functions.\r\nIf a DataFrame column contains numbers, and it is explicitely converted to CategoricalDType, it will be correctly treated as categorical by functions such as boxplot only if it is passed to `x` argument.\r\nIf it is instead passed to `y` argument of the plotting function, it will be treated as numerical, and the other variable will be treated as categorical (even though the other variable is obviously numerical).\r\n\r\nI am using Python 3.7, Matplotlib 3.3.1, Seaborn 0.11, Numpy 1.19.1, and Pandas 1.1.1 .\r\nI am using Matplotlib backend: 'module://ipykernel.pylab.backend_inline'\r\n\r\n\r\nReproducible code:\r\n```python\r\n\r\n#Create DataFrame with a numerical column, and a categorical column with number as classes.\r\nn_points = 50\r\n\r\ndf = pd.DataFrame({\"value\": np.random.rand(n_points),\r\n                   \"class\": np.random.randint(0, 2, n_points),\r\n                   })\r\n\r\n#Explicitely set `class` column to categorical data type.\r\ndf[\"class\"] = df[\"class\"].astype(\"category\")\r\n\r\n#If `class` column is passed to `x` argument, the plot is correct: column is treated as categorical.\r\nsns.boxplot(data=df,\r\n            x=\"class\",\r\n            y=\"value\",\r\n            );\r\n\r\n#BUG: If `class` column is passed to `y` argument, the plot is incorrect: `class` is treated as numerical!\r\nsns.boxplot(data=df,\r\n            x=\"value\",\r\n            y=\"class\",\r\n            );\r\n\r\n```\r\n\r\nPlease take a look at\r\n[bug_categorical_numbers.pdf](https://github.com/mwaskom/seaborn/files/5371402/bug_categorical_numbers.pdf)\r\n the attached PDF file with the correct and wrong plots.",
      "issue_closed_at": "2020-12-12T14:22:35Z",
      "base_commit": "ae123d79ed341d352d3f29b6936c044350b75e86",
      "changes": [
        {
          "file": "seaborn/_core.py",
          "type": "function",
          "name": "_add_axis_labels",
          "class_name": "VectorPlotter",
          "code": "def _add_axis_labels(self, ax, default_x=\"\", default_y=\"\"):\n        \"\"\"Add axis labels if not present, set visibility to match ticklabels.\"\"\"\n        # TODO ax could default to None and use attached axes if present\n        # but what to do about the case of facets? Currently using FacetGrid's\n        # set_axis_labels method, which doesn't add labels to the interior even\n        # when the axes are not shared. Maybe that makes sense?\n        if not ax.get_xlabel():\n            x_visible = any(t.get_visible() for t in ax.get_xticklabels())\n            ax.set_xlabel(self.variables.get(\"x\", default_x), visible=x_visible)\n        if not ax.get_ylabel():\n            y_visible = any(t.get_visible() for t in ax.get_yticklabels())\n            ax.set_ylabel(self.variables.get(\"y\", default_y), visible=y_visible)"
        },
        {
          "file": "seaborn/_core.py",
          "type": "function",
          "name": "variable_type",
          "class_name": null,
          "code": "def variable_type(vector, boolean_type=\"numeric\"):\n    \"\"\"Determine whether a vector contains numeric, categorical, or dateime data.\n\n    This function differs from the pandas typing API in two ways:\n\n    - Python sequences or object-typed PyData objects are considered numeric if\n      all of their entries are numeric.\n    - String or mixed-type data are considered categorical even if not\n      explicitly represented as a :class:pandas.api.types.CategoricalDtype`.\n\n    Parameters\n    ----------\n    vector : :func:`pandas.Series`, :func:`numpy.ndarray`, or Python sequence\n        Input data to test.\n    binary_type : 'numeric' or 'categorical'\n        Type to use for vectors containing only 0s and 1s (and NAs).\n\n    Returns\n    -------\n    var_type : 'numeric', 'categorical', or 'datetime'\n        Name identifying the type of data in the vector.\n\n    \"\"\"\n    # Special-case all-na data, which is always \"numeric\"\n    if pd.isna(vector).all():\n        return \"numeric\"\n\n    # Special-case binary/boolean data, allow caller to determine\n    # This triggers a numpy warning when vector has strings/objects\n    # https://github.com/numpy/numpy/issues/6784\n    # Because we reduce with .all(), we are agnostic about whether the\n    # comparison returns a scalar or vector, so we will ignore the warning.\n    # It triggers a separate DeprecationWarning when the vector has datetimes:\n    # https://github.com/numpy/numpy/issues/13548\n    # This is considered a bug by numpy and will likely go away.\n    with warnings.catch_warnings():\n        warnings.simplefilter(\n            action='ignore', category=(FutureWarning, DeprecationWarning)\n        )\n        if np.isin(vector, [0, 1, np.nan]).all():\n            return boolean_type\n\n    # Defer to positive pandas tests\n    if pd.api.types.is_numeric_dtype(vector):\n        return \"numeric\"\n\n    if pd.api.types.is_categorical_dtype(vector):\n        return \"categorical\"\n\n    if pd.api.types.is_datetime64_dtype(vector):\n        return \"datetime\"\n\n    # --- If we get to here, we need to check the entries\n\n    # Check for a collection where everything is a number\n\n    def all_numeric(x):\n        for x_i in x:\n            if not isinstance(x_i, Number):\n                return False\n        return True\n\n    if all_numeric(vector):\n        return \"numeric\"\n\n    # Check for a collection where everything is a datetime\n\n    def all_datetime(x):\n        for x_i in x:\n            if not isinstance(x_i, (datetime, np.datetime64)):\n                return False\n        return True\n\n    if all_datetime(vector):\n        return \"datetime\"\n\n    # Otherwise, our final fallback is to consider things categorical\n\n    return \"categorical\""
        }
      ]
    }
  ]
}