{
  "instance_id": "pydata__xarray-3364",
  "repo": "pydata/xarray",
  "created_at": "2019-10-01T21:15:54Z",
  "problem_statement": "Ignore missing variables when concatenating datasets?\nSeveral users (@raj-kesavan, @richardotis, now myself) have wondered about how to concatenate xray Datasets with different variables.\n\nWith the current `xray.concat`, you need to awkwardly create dummy variables filled with `NaN` in datasets that don't have them (or drop mismatched variables entirely). Neither of these are great options -- `concat` should have an option (the default?) to take care of this for the user.\n\nThis would also be more consistent with `pd.concat`, which takes a more relaxed approach to matching dataframes with different variables (it does an outer join).\n\n",
  "patch": "diff --git a/xarray/core/concat.py b/xarray/core/concat.py\n--- a/xarray/core/concat.py\n+++ b/xarray/core/concat.py\n@@ -312,15 +312,9 @@ def _dataset_concat(\n         to_merge = {var: [] for var in variables_to_merge}\n \n         for ds in datasets:\n-            absent_merge_vars = variables_to_merge - set(ds.variables)\n-            if absent_merge_vars:\n-                raise ValueError(\n-                    \"variables %r are present in some datasets but not others. \"\n-                    % absent_merge_vars\n-                )\n-\n             for var in variables_to_merge:\n-                to_merge[var].append(ds.variables[var])\n+                if var in ds:\n+                    to_merge[var].append(ds.variables[var])\n \n         for var in variables_to_merge:\n             result_vars[var] = unique_variable(\n",
  "similar_bug_items": [
    {
      "pr_number": 3028,
      "pr_title": "Add \"errors\" keyword argument to drop() and drop_dims() (#2994)",
      "pr_body": "<!-- Feel free to remove check-list items aren't relevant to your change -->\r\n\r\n - [x] Closes #2994 \r\n - [x] Tests added\r\n - [x] Fully documented, including `whats-new.rst` for all changes and `api.rst` for new API\r\n\r\nThis addresses #2994 by adding an \"errors\" keyword argument to `Dataset.drop()`, `Dataset.drop_dims()`, and `DataArray.drop()`. \r\n\r\nI stuck with pandas' convention of using either `errors='raise'`, now the default that maintains previous behavior by raising an error if any passed label is not found in the dataset/array, or `errors='ignore'` in which case any missing labels are silently ignored. \r\n\r\nThis seems like a pretty straightforward change; mainly it is just skipping checks for missing labels when `errors == 'ignore'` and passing the errors keyword over to the pandas method when using `index.drop()`. Hopefully there are no subtleties that I've missed. \r\n\r\nI added documentation to the appropriate methods, although I have been struggling to build the docs locally and am unsure if they look right.\r\n\r\nAlso this is my first attempt to contribute to any project, so suggestions and feedback are welcome. ",
      "issue_id": 2994,
      "issue_title": "xr.Dataset.drop",
      "issue_body": "Currently, `drop` throws an error if one of the labels doesn't exist. It would be nice to have a parameter in the drop method for optionally ignoring errors like in the pandas.DataFrame.\r\nFrom the pandas [documentation](https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.drop.html):\r\n\r\n> errors : {\u2018ignore\u2019, \u2018raise\u2019}, default \u2018raise\u2019\r\n>     If \u2018ignore\u2019, suppress error and only existing labels are dropped.\r\n",
      "issue_closed_at": "2019-06-20T15:48:00Z",
      "base_commit": "c2a2a6efcaf2d279c78da4ba3a87ea96afe78be0",
      "changes": [
        {
          "file": "xarray/core/dataarray.py",
          "type": "function",
          "name": "transpose",
          "class_name": "DataArray",
          "code": "def transpose(self, *dims, transpose_coords=None) -> 'DataArray':\n        \"\"\"Return a new DataArray object with transposed dimensions.\n\n        Parameters\n        ----------\n        *dims : str, optional\n            By default, reverse the dimensions. Otherwise, reorder the\n            dimensions to this order.\n        transpose_coords : boolean, optional\n            If True, also transpose the coordinates of this DataArray.\n\n        Returns\n        -------\n        transposed : DataArray\n            The returned DataArray's array is transposed.\n\n        Notes\n        -----\n        This operation returns a view of this array's data. It is\n        lazy for dask-backed DataArrays but not for numpy-backed DataArrays\n        -- the data will be fully loaded.\n\n        See Also\n        --------\n        numpy.transpose\n        Dataset.transpose\n        \"\"\"\n        if dims:\n            if set(dims) ^ set(self.dims):\n                raise ValueError('arguments to transpose (%s) must be '\n                                 'permuted array dimensions (%s)'\n                                 % (dims, tuple(self.dims)))\n\n        variable = self.variable.transpose(*dims)\n        if transpose_coords:\n            coords = {}\n            for name, coord in self.coords.items():\n                coord_dims = tuple(dim for dim in dims if dim in coord.dims)\n                coords[name] = coord.variable.transpose(*coord_dims)\n            return self._replace(variable, coords)\n        else:\n            if transpose_coords is None \\\n                    and any(self[c].ndim > 1 for c in self.coords):\n                warnings.warn('This DataArray contains multi-dimensional '\n                              'coordinates. In the future, these coordinates '\n                              'will be transposed as well unless you specify '\n                              'transpose_coords=False.',\n                              FutureWarning, stacklevel=2)\n            return self._replace(variable)"
        },
        {
          "file": "xarray/core/dataarray.py",
          "type": "function",
          "name": "drop",
          "class_name": "DataArray",
          "code": "def drop(self, labels, dim=None):\n        \"\"\"Drop coordinates or index labels from this DataArray.\n\n        Parameters\n        ----------\n        labels : scalar or list of scalars\n            Name(s) of coordinate variables or index labels to drop.\n        dim : str, optional\n            Dimension along which to drop index labels. By default (if\n            ``dim is None``), drops coordinates rather than index labels.\n\n        Returns\n        -------\n        dropped : DataArray\n        \"\"\"\n        if utils.is_scalar(labels):\n            labels = [labels]\n        ds = self._to_temp_dataset().drop(labels, dim)\n        return self._from_temp_dataset(ds)"
        },
        {
          "file": "xarray/core/dataset.py",
          "type": "function",
          "name": "_assert_all_in_dataset",
          "class_name": "Dataset",
          "code": "def _assert_all_in_dataset(self, names, virtual_okay=False):\n        bad_names = set(names) - set(self._variables)\n        if virtual_okay:\n            bad_names -= self.virtual_variables\n        if bad_names:\n            raise ValueError('One or more of the specified variables '\n                             'cannot be found in this dataset')"
        },
        {
          "file": "xarray/core/dataset.py",
          "type": "function",
          "name": "drop",
          "class_name": "Dataset",
          "code": "def drop(self, labels, dim=None):\n        \"\"\"Drop variables or index labels from this dataset.\n\n        Parameters\n        ----------\n        labels : scalar or list of scalars\n            Name(s) of variables or index labels to drop.\n        dim : None or str, optional\n            Dimension along which to drop index labels. By default (if\n            ``dim is None``), drops variables rather than index labels.\n\n        Returns\n        -------\n        dropped : Dataset\n        \"\"\"\n        if utils.is_scalar(labels):\n            labels = [labels]\n        if dim is None:\n            return self._drop_vars(labels)\n        else:\n            try:\n                index = self.indexes[dim]\n            except KeyError:\n                raise ValueError(\n                    'dimension %r does not have coordinate labels' % dim)\n            new_index = index.drop(labels)\n            return self.loc[{dim: new_index}]"
        },
        {
          "file": "xarray/core/dataset.py",
          "type": "function",
          "name": "drop_dims",
          "class_name": "Dataset",
          "code": "def drop_dims(self, drop_dims):\n        \"\"\"Drop dimensions and associated variables from this dataset.\n\n        Parameters\n        ----------\n        drop_dims : str or list\n            Dimension or dimensions to drop.\n\n        Returns\n        -------\n        obj : Dataset\n            The dataset without the given dimensions (or any variables\n            containing those dimensions)\n        \"\"\"\n        if utils.is_scalar(drop_dims):\n            drop_dims = [drop_dims]\n\n        missing_dimensions = [d for d in drop_dims if d not in self.dims]\n        if missing_dimensions:\n            raise ValueError('Dataset does not contain the dimensions: %s'\n                             % missing_dimensions)\n\n        drop_vars = set(k for k, v in self._variables.items()\n                        for d in v.dims if d in drop_dims)\n\n        variables = OrderedDict((k, v) for k, v in self._variables.items()\n                                if k not in drop_vars)\n        coord_names = set(k for k in self._coord_names if k in variables)\n\n        return self._replace_with_new_dims(variables, coord_names)"
        }
      ]
    },
    {
      "pr_number": 219,
      "pr_title": "Fix concat str truncation",
      "pr_body": "Fixes #217.\n\nI also took the opportunity to add two small optimizations, which add up to make `Variable.concat` about 35% faster.\n",
      "issue_id": 217,
      "issue_title": "Strings are truncated when concatenating Datasets.",
      "issue_body": "When concatenating Datasets, a variable's string length is limited to the length in the first of the Datasets being concatenated.\n\n```\n>>> import xray\n>>> first = xray.Dataset({'animal': ('animal', ['horse'])})\n>>> second = xray.Dataset( {'animal': ('animal', ['aardvark_0'])})\n>>> xray.Dataset.concat([first, second], dimension='animal')['animal']\n<xray.DataArray 'animal' (animal: 2)>\narray(['horse', 'aardv'], \n      dtype='|S5')\nCoordinates:\n    animal: Index([u'horse', u'aardv'], dtype='object')\nAttributes:\n    Empty\n```\n\n(Note the `|S5` dtype and the truncated `aardv`)\n\nI think this is the offending line: https://github.com/xray/xray/blob/master/xray/core/variable.py#L623\nMay want to use `dtype=object` for strings to avoid this issue.\n",
      "issue_closed_at": "2014-08-21T05:17:28Z",
      "base_commit": "4a9f283fdb2b4c7588a8ca373e9f3cb9af401bf4",
      "changes": [
        {
          "file": "xray/core/variable.py",
          "type": "function",
          "name": "concat",
          "class_name": "Variable",
          "code": "def concat(cls, variables, dim='concat_dim', indexers=None, length=None,\n               shortcut=False):\n        \"\"\"Concatenate variables along a new or existing dimension.\n\n        Parameters\n        ----------\n        variables : iterable of Array\n            Arrays to stack together. Each variable is expected to have\n            matching dimensions and shape except for along the stacked\n            dimension.\n        dim : str or DataArray, optional\n            Name of the dimension to stack along. This can either be a new\n            dimension name, in which case it is added along axis=0, or an\n            existing dimension name, in which case the location of the\n            dimension is unchanged. Where to insert the new dimension is\n            determined by the first variable.\n        indexers : iterable of indexers, optional\n            Iterable of indexers of the same length as variables which\n            specifies how to assign variables along the given dimension. If\n            not supplied, indexers is inferred from the length of each\n            variable along the dimension, and the variables are stacked in the\n            given order.\n        length : int, optional\n            Length of the new dimension. This is used to allocate the new data\n            array for the stacked variable data before iterating over all\n            items, which is thus more memory efficient and a bit faster. If\n            dimension is provided as a DataArray, length is calculated\n            automatically.\n        shortcut : bool, optional\n            This option is used internally to speed-up groupby operations.\n            If `shortcut` is True, some checks of internal consistency between\n            arrays to concatenate are skipped.\n\n        Returns\n        -------\n        stacked : Variable\n            Concatenated Variable formed by stacking all the supplied variables\n            along the given dimension.\n        \"\"\"\n        if not isinstance(dim, basestring):\n            length = dim.size\n            dim, = dim.dims\n\n        if length is None or indexers is None:\n            # so much for lazy evaluation! we need to look at all the variables\n            # to figure out the indexers and/or dimensions of the stacked\n            # variable\n            variables = list(variables)\n            steps = [var.shape[var.get_axis_num(dim)]\n                     if dim in var.dims else 1\n                     for var in variables]\n            if length is None:\n                length = sum(steps)\n            if indexers is None:\n                indexers = []\n                i = 0\n                for step in steps:\n                    indexers.append(slice(i, i + step))\n                    i += step\n                if i != length:\n                    raise ValueError('actual length of stacked variables '\n                                     'along %s is %r but expected length was '\n                                     '%s' % (dim, i, length))\n\n        # initialize the stacked variable with empty data\n        from . import groupby\n        first_var, variables = groupby.peek_at(variables)\n        if dim in first_var.dims:\n            axis = first_var.get_axis_num(dim)\n            shape = tuple(length if n == axis else s\n                          for n, s in enumerate(first_var.shape))\n            dims = first_var.dims\n        else:\n            axis = 0\n            shape = (length,) + first_var.shape\n            dims = (dim,) + first_var.dims\n\n        concatenated = cls(dims, np.empty(shape, dtype=first_var.dtype))\n        concatenated.attrs.update(first_var.attrs)\n\n        alt_dims = tuple(d for d in dims if d != dim)\n\n        # copy in the data from the variables\n        for var, indexer in zip(variables, indexers):\n            if not shortcut:\n                # do sanity checks & attributes clean-up\n                if dim in var.dims:\n                    # transpose verifies that the dims are equivalent\n                    if var.dims != concatenated.dims:\n                        var = var.transpose(*concatenated.dims)\n                elif var.dims != alt_dims:\n                    raise ValueError('inconsistent dimensions')\n                utils.remove_incompatible_items(concatenated.attrs, var.attrs)\n\n            key = tuple(indexer if n == axis else slice(None)\n                        for n in range(concatenated.ndim))\n            concatenated.values[key] = var.values\n\n        return concatenated"
        },
        {
          "file": "xray/core/variable.py",
          "type": "function",
          "name": "concat",
          "class_name": "Variable",
          "code": "def concat(cls, variables, dim='concat_dim', indexers=None, length=None,\n               shortcut=False):\n        \"\"\"Concatenate variables along a new or existing dimension.\n\n        Parameters\n        ----------\n        variables : iterable of Array\n            Arrays to stack together. Each variable is expected to have\n            matching dimensions and shape except for along the stacked\n            dimension.\n        dim : str or DataArray, optional\n            Name of the dimension to stack along. This can either be a new\n            dimension name, in which case it is added along axis=0, or an\n            existing dimension name, in which case the location of the\n            dimension is unchanged. Where to insert the new dimension is\n            determined by the first variable.\n        indexers : iterable of indexers, optional\n            Iterable of indexers of the same length as variables which\n            specifies how to assign variables along the given dimension. If\n            not supplied, indexers is inferred from the length of each\n            variable along the dimension, and the variables are stacked in the\n            given order.\n        length : int, optional\n            Length of the new dimension. This is used to allocate the new data\n            array for the stacked variable data before iterating over all\n            items, which is thus more memory efficient and a bit faster. If\n            dimension is provided as a DataArray, length is calculated\n            automatically.\n        shortcut : bool, optional\n            This option is used internally to speed-up groupby operations.\n            If `shortcut` is True, some checks of internal consistency between\n            arrays to concatenate are skipped.\n\n        Returns\n        -------\n        stacked : Variable\n            Concatenated Variable formed by stacking all the supplied variables\n            along the given dimension.\n        \"\"\"\n        if not isinstance(dim, basestring):\n            length = dim.size\n            dim, = dim.dims\n\n        if length is None or indexers is None:\n            # so much for lazy evaluation! we need to look at all the variables\n            # to figure out the indexers and/or dimensions of the stacked\n            # variable\n            variables = list(variables)\n            steps = [var.shape[var.get_axis_num(dim)]\n                     if dim in var.dims else 1\n                     for var in variables]\n            if length is None:\n                length = sum(steps)\n            if indexers is None:\n                indexers = []\n                i = 0\n                for step in steps:\n                    indexers.append(slice(i, i + step))\n                    i += step\n                if i != length:\n                    raise ValueError('actual length of stacked variables '\n                                     'along %s is %r but expected length was '\n                                     '%s' % (dim, i, length))\n\n        # initialize the stacked variable with empty data\n        from . import groupby\n        first_var, variables = groupby.peek_at(variables)\n        if dim in first_var.dims:\n            axis = first_var.get_axis_num(dim)\n            shape = tuple(length if n == axis else s\n                          for n, s in enumerate(first_var.shape))\n            dims = first_var.dims\n        else:\n            axis = 0\n            shape = (length,) + first_var.shape\n            dims = (dim,) + first_var.dims\n\n        concatenated = cls(dims, np.empty(shape, dtype=first_var.dtype))\n        concatenated.attrs.update(first_var.attrs)\n\n        alt_dims = tuple(d for d in dims if d != dim)\n\n        # copy in the data from the variables\n        for var, indexer in zip(variables, indexers):\n            if not shortcut:\n                # do sanity checks & attributes clean-up\n                if dim in var.dims:\n                    # transpose verifies that the dims are equivalent\n                    if var.dims != concatenated.dims:\n                        var = var.transpose(*concatenated.dims)\n                elif var.dims != alt_dims:\n                    raise ValueError('inconsistent dimensions')\n                utils.remove_incompatible_items(concatenated.attrs, var.attrs)\n\n            key = tuple(indexer if n == axis else slice(None)\n                        for n in range(concatenated.ndim))\n            concatenated.values[key] = var.values\n\n        return concatenated"
        }
      ]
    },
    {
      "pr_number": 598,
      "pr_title": "Fix colormap for facet grid plots",
      "pr_body": "Fixes #592\n\nAdded test to check that all subplots in facet grid have same data range and colormap.\n\nThis fixes two issues present in the existing code: \n\n1) colormap was being selected for each subplot\n2) range was being selected for each subplot and colorbar was the result of only the last subplot\n\nSome sample code: \n\n``` Python\ndata = (np.random.random(size=(20, 25, 12)) + np.linspace(-3, 3, 12)) # range is ~ -3 to 4\nda = xray.DataArray(data, dims=['x', 'y', 'time'], name='data')\nfg = da.plot.pcolormesh(col='time', col_wrap=4)\n```\n\npreviously yielded this plot:\n![broken](https://cloud.githubusercontent.com/assets/2443309/10212715/f752a92e-67b7-11e5-8477-f5fc877fe716.png)\n\nand now yields this plot:\n![fixed](https://cloud.githubusercontent.com/assets/2443309/10212716/000fe1f8-67b8-11e5-8265-7ce2a89f8fa4.png)\n",
      "issue_id": 592,
      "issue_title": "Faceted plots can pick different colormaps for different facets",
      "issue_body": "For example:\n\n```\nds.tmin.plot.imshow(col='T', col_wrap=4)\n```\n\n![image](https://cloud.githubusercontent.com/assets/1217238/10151810/47551696-6600-11e5-85af-5c985468d6d5.png)\n\nWe should make sure the default logic doesn't do this.\n",
      "issue_closed_at": "2015-10-01T17:10:31Z",
      "base_commit": "1ec0e3592be5e9136824144809aa763499134ec7",
      "changes": [
        {
          "file": "xray/plot/facetgrid.py",
          "type": "function",
          "name": "__init__",
          "class_name": "FacetGrid",
          "code": "def __init__(self, data, col=None, row=None, col_wrap=None,\n                 aspect=1, size=3):\n        \"\"\"\n        Parameters\n        ----------\n        data : DataArray\n            xray DataArray to be plotted\n        row, col : strings\n            Dimesion names that define subsets of the data, which will be drawn\n            on separate facets in the grid.\n        col_wrap : int, optional\n            \"Wrap\" the column variable at this width, so that the column facets\n        aspect : scalar, optional\n            Aspect ratio of each facet, so that ``aspect * size`` gives the\n            width of each facet in inches\n        size : scalar, optional\n            Height (in inches) of each facet. See also: ``aspect``\n\n        \"\"\"\n\n        import matplotlib.pyplot as plt\n\n        # Handle corner case of nonunique coordinates\n        rep_col = col is not None and not data[col].to_index().is_unique\n        rep_row = row is not None and not data[row].to_index().is_unique\n        if rep_col or rep_row:\n            raise ValueError('Coordinates used for faceting cannot '\n                             'contain repeated (nonunique) values.')\n\n        # single_group is the grouping variable, if there is exactly one\n        if col and row:\n            single_group = False\n            nrow = len(data[row])\n            ncol = len(data[col])\n            nfacet = nrow * ncol\n            if col_wrap is not None:\n                warnings.warn('Ignoring col_wrap since both col and row '\n                              'were passed')\n        elif row and not col:\n            single_group = row\n        elif not row and col:\n            single_group = col\n        else:\n            raise ValueError(\n                'Pass a coordinate name as an argument for row or col')\n\n        # Compute grid shape\n        if single_group:\n            nfacet = len(data[single_group])\n            if col:\n                # idea - could add heuristic for nice shapes like 3x4\n                ncol = nfacet\n            if row:\n                ncol = 1\n            if col_wrap is not None:\n                # Overrides previous settings\n                ncol = col_wrap\n            nrow = int(np.ceil(nfacet / ncol))\n\n        # Calculate the base figure size with extra horizontal space for a\n        # colorbar\n        cbar_space = 1\n        figsize = (ncol * size * aspect + cbar_space, nrow * size)\n\n        fig, axes = plt.subplots(nrow, ncol,\n                                 sharex=True, sharey=True,\n                                 squeeze=False, figsize=figsize)\n\n        # Set up the lists of names for the row and column facet variables\n        col_names = list(data[col].values) if col else []\n        row_names = list(data[row].values) if row else []\n\n        if single_group:\n            full = [{single_group: x} for x in\n                    data[single_group].values]\n            empty = [None for x in range(nrow * ncol - len(full))]\n            name_dicts = full + empty\n        else:\n            rowcols = itertools.product(row_names, col_names)\n            name_dicts = [{row: r, col: c} for r, c in rowcols]\n\n        name_dicts = np.array(name_dicts).reshape(nrow, ncol)\n\n        # Set up the class attributes\n        # ---------------------------\n\n        # First the public API\n        self.data = data\n        self.name_dicts = name_dicts\n        self.fig = fig\n        self.axes = axes\n        self.row_names = row_names\n        self.col_names = col_names\n\n        # Next the private variables\n        self._single_group = single_group\n        self._nrow = nrow\n        self._row_var = row\n        self._ncol = ncol\n        self._col_var = col\n        self._col_wrap = col_wrap\n        self._x_var = None\n        self._y_var = None\n\n        self.set_titles()"
        },
        {
          "file": "xray/plot/facetgrid.py",
          "type": "function",
          "name": "map_dataarray",
          "class_name": "FacetGrid",
          "code": "def map_dataarray(self, func, x, y, **kwargs):\n        \"\"\"\n        Apply a plotting function to a 2d facet's subset of the data.\n\n        This is more convenient and less general than ``FacetGrid.map``\n\n        Parameters\n        ----------\n        func : callable\n            A plotting function with the same signature as a 2d xray\n            plotting method such as `xray.plot.imshow`\n        x, y : string\n            Names of the coordinates to plot on x, y axes\n        kwargs :\n            additional keyword arguments to func\n\n        Returns\n        -------\n        self : FacetGrid object\n\n        \"\"\"\n\n        # These should be consistent with xray.plot._plot2d\n        cmap_kwargs = {'plot_data': self.data.values,\n                       'vmin': None,\n                       'vmax': None,\n                       'cmap': None,\n                       'center': None,\n                       'robust': False,\n                       'extend': None,\n                       # MPL default\n                       'levels': 7 if 'contour' in func.__name__ else None,\n                       'filled': func.__name__ != 'contour',\n                       }\n\n        # Allow kwargs to override these defaults\n        for param in kwargs:\n            if param in cmap_kwargs:\n                cmap_kwargs[param] = kwargs[param]\n\n        # colormap inference has to happen here since all the data in\n        # self.data is required to make the right choice\n        cmap_params = _determine_cmap_params(**cmap_kwargs)\n\n        if 'contour' in func.__name__:\n            # extend is a keyword argument only for contour and contourf, but\n            # passing it to the colorbar is sufficient for imshow and\n            # pcolormesh\n            kwargs['extend'] = cmap_params['extend']\n            kwargs['levels'] = cmap_params['levels']\n\n        defaults = {\n            'add_colorbar': False,\n            'add_labels': False,\n            'norm': cmap_params.pop('cnorm'),\n        }\n\n        # Order is important\n        defaults.update(cmap_params)\n        defaults.update(kwargs)\n\n        for d, ax in zip(self.name_dicts.flat, self.axes.flat):\n            # None is the sentinel value\n            if d is not None:\n                subset = self.data.loc[d]\n                mappable = func(subset, x, y, ax=ax, **defaults)\n\n        # Left side labels\n        for ax in self.axes[:, 0]:\n            ax.set_ylabel(y)\n\n        # Bottom labels\n        for ax in self.axes[-1, :]:\n            ax.set_xlabel(x)\n\n        self.fig.tight_layout()\n\n        if self._single_group:\n            for d, ax in zip(self.name_dicts.flat, self.axes.flat):\n                if d is None:\n                    ax.set_visible(False)\n\n        # colorbar\n        if kwargs.get('add_colorbar', True):\n            cbar = self.fig.colorbar(mappable,\n                                     ax=list(self.axes.flat),\n                                     extend=cmap_params['extend'])\n\n            if self.data.name:\n                cbar.set_label(self.data.name, rotation=270,\n                               verticalalignment='bottom')\n\n        self._x_var = x\n        self._y_var = y\n\n        return self"
        },
        {
          "file": "xray/plot/facetgrid.py",
          "type": "function",
          "name": "map_dataarray",
          "class_name": "FacetGrid",
          "code": "def map_dataarray(self, func, x, y, **kwargs):\n        \"\"\"\n        Apply a plotting function to a 2d facet's subset of the data.\n\n        This is more convenient and less general than ``FacetGrid.map``\n\n        Parameters\n        ----------\n        func : callable\n            A plotting function with the same signature as a 2d xray\n            plotting method such as `xray.plot.imshow`\n        x, y : string\n            Names of the coordinates to plot on x, y axes\n        kwargs :\n            additional keyword arguments to func\n\n        Returns\n        -------\n        self : FacetGrid object\n\n        \"\"\"\n\n        # These should be consistent with xray.plot._plot2d\n        cmap_kwargs = {'plot_data': self.data.values,\n                       'vmin': None,\n                       'vmax': None,\n                       'cmap': None,\n                       'center': None,\n                       'robust': False,\n                       'extend': None,\n                       # MPL default\n                       'levels': 7 if 'contour' in func.__name__ else None,\n                       'filled': func.__name__ != 'contour',\n                       }\n\n        # Allow kwargs to override these defaults\n        for param in kwargs:\n            if param in cmap_kwargs:\n                cmap_kwargs[param] = kwargs[param]\n\n        # colormap inference has to happen here since all the data in\n        # self.data is required to make the right choice\n        cmap_params = _determine_cmap_params(**cmap_kwargs)\n\n        if 'contour' in func.__name__:\n            # extend is a keyword argument only for contour and contourf, but\n            # passing it to the colorbar is sufficient for imshow and\n            # pcolormesh\n            kwargs['extend'] = cmap_params['extend']\n            kwargs['levels'] = cmap_params['levels']\n\n        defaults = {\n            'add_colorbar': False,\n            'add_labels': False,\n            'norm': cmap_params.pop('cnorm'),\n        }\n\n        # Order is important\n        defaults.update(cmap_params)\n        defaults.update(kwargs)\n\n        for d, ax in zip(self.name_dicts.flat, self.axes.flat):\n            # None is the sentinel value\n            if d is not None:\n                subset = self.data.loc[d]\n                mappable = func(subset, x, y, ax=ax, **defaults)\n\n        # Left side labels\n        for ax in self.axes[:, 0]:\n            ax.set_ylabel(y)\n\n        # Bottom labels\n        for ax in self.axes[-1, :]:\n            ax.set_xlabel(x)\n\n        self.fig.tight_layout()\n\n        if self._single_group:\n            for d, ax in zip(self.name_dicts.flat, self.axes.flat):\n                if d is None:\n                    ax.set_visible(False)\n\n        # colorbar\n        if kwargs.get('add_colorbar', True):\n            cbar = self.fig.colorbar(mappable,\n                                     ax=list(self.axes.flat),\n                                     extend=cmap_params['extend'])\n\n            if self.data.name:\n                cbar.set_label(self.data.name, rotation=270,\n                               verticalalignment='bottom')\n\n        self._x_var = x\n        self._y_var = y\n\n        return self"
        },
        {
          "file": "xray/plot/facetgrid.py",
          "type": "function",
          "name": "map_dataarray",
          "class_name": "FacetGrid",
          "code": "def map_dataarray(self, func, x, y, **kwargs):\n        \"\"\"\n        Apply a plotting function to a 2d facet's subset of the data.\n\n        This is more convenient and less general than ``FacetGrid.map``\n\n        Parameters\n        ----------\n        func : callable\n            A plotting function with the same signature as a 2d xray\n            plotting method such as `xray.plot.imshow`\n        x, y : string\n            Names of the coordinates to plot on x, y axes\n        kwargs :\n            additional keyword arguments to func\n\n        Returns\n        -------\n        self : FacetGrid object\n\n        \"\"\"\n\n        # These should be consistent with xray.plot._plot2d\n        cmap_kwargs = {'plot_data': self.data.values,\n                       'vmin': None,\n                       'vmax': None,\n                       'cmap': None,\n                       'center': None,\n                       'robust': False,\n                       'extend': None,\n                       # MPL default\n                       'levels': 7 if 'contour' in func.__name__ else None,\n                       'filled': func.__name__ != 'contour',\n                       }\n\n        # Allow kwargs to override these defaults\n        for param in kwargs:\n            if param in cmap_kwargs:\n                cmap_kwargs[param] = kwargs[param]\n\n        # colormap inference has to happen here since all the data in\n        # self.data is required to make the right choice\n        cmap_params = _determine_cmap_params(**cmap_kwargs)\n\n        if 'contour' in func.__name__:\n            # extend is a keyword argument only for contour and contourf, but\n            # passing it to the colorbar is sufficient for imshow and\n            # pcolormesh\n            kwargs['extend'] = cmap_params['extend']\n            kwargs['levels'] = cmap_params['levels']\n\n        defaults = {\n            'add_colorbar': False,\n            'add_labels': False,\n            'norm': cmap_params.pop('cnorm'),\n        }\n\n        # Order is important\n        defaults.update(cmap_params)\n        defaults.update(kwargs)\n\n        for d, ax in zip(self.name_dicts.flat, self.axes.flat):\n            # None is the sentinel value\n            if d is not None:\n                subset = self.data.loc[d]\n                mappable = func(subset, x, y, ax=ax, **defaults)\n\n        # Left side labels\n        for ax in self.axes[:, 0]:\n            ax.set_ylabel(y)\n\n        # Bottom labels\n        for ax in self.axes[-1, :]:\n            ax.set_xlabel(x)\n\n        self.fig.tight_layout()\n\n        if self._single_group:\n            for d, ax in zip(self.name_dicts.flat, self.axes.flat):\n                if d is None:\n                    ax.set_visible(False)\n\n        # colorbar\n        if kwargs.get('add_colorbar', True):\n            cbar = self.fig.colorbar(mappable,\n                                     ax=list(self.axes.flat),\n                                     extend=cmap_params['extend'])\n\n            if self.data.name:\n                cbar.set_label(self.data.name, rotation=270,\n                               verticalalignment='bottom')\n\n        self._x_var = x\n        self._y_var = y\n\n        return self"
        }
      ]
    },
    {
      "pr_number": 477,
      "pr_title": "Bytes attributes are decoded to strings with engine='h5netcdf'",
      "pr_body": "Fixes #451\n",
      "issue_id": 451,
      "issue_title": "Conventions decoding should properly handle byte type attributes on Python 3",
      "issue_body": "This only appears with the h5netcdf backend (for now), because netCDF4-python decodes all string attributes to unicode on Python 3.\n\nWe might also fix this upstream in h5netcdf by copying this behavior from netCDF4-python.\n\nxref https://github.com/xray/xray/issues/444#issuecomment-117993960\n",
      "issue_closed_at": "2015-07-16T18:11:42Z",
      "base_commit": "7c9a2fe27794a9761319daa4dc90a7e4e19c795e",
      "changes": [
        {
          "file": "xray/backends/h5netcdf_.py",
          "type": "line",
          "name": "line 2",
          "code": "from .. import Variable\nfrom ..conventions import cf_encoder\nfrom ..core import indexing\nfrom ..core.utils import FrozenOrderedDict, close_on_error\nfrom ..core.pycompat import iteritems, basestring, unicode_type, OrderedDict\n\nfrom .common import AbstractWritableDataStore\nfrom .netCDF4_ import _nc4_group, _nc4_values_and_dtype\n\n\nclass H5NetCDFStore(AbstractWritableDataStore):\n    \"\"\"Store for reading and writing data via h5netcdf\n    \"\"\""
        },
        {
          "file": "xray/backends/h5netcdf_.py",
          "type": "function",
          "name": "store",
          "class_name": "H5NetCDFStore",
          "code": "def store(self, variables, attributes):\n        # All NetCDF files get CF encoded by default, without this attempting\n        # to write times, for example, would fail.\n        cf_variables, cf_attrs = cf_encoder(variables, attributes)\n        AbstractWritableDataStore.store(self, cf_variables, cf_attrs)"
        },
        {
          "file": "xray/backends/h5netcdf_.py",
          "type": "function",
          "name": "open_store_variable",
          "class_name": "H5NetCDFStore",
          "code": "def open_store_variable(self, var):\n        dimensions = var.dimensions\n        data = indexing.LazilyIndexedArray(var)\n        attributes = OrderedDict((k, var.getncattr(k))\n                                 for k in var.ncattrs())\n\n        # netCDF4 specific encoding\n        encoding = dict(var.filters())\n        chunking = var.chunking()\n        encoding['chunksizes'] = chunking if chunking != 'contiguous' else None\n\n        # save source so __repr__ can detect if it's local or not\n        encoding['source'] = self._filename\n\n        return Variable(dimensions, data, attributes, encoding)"
        }
      ]
    },
    {
      "pr_number": 715,
      "pr_title": "Error when attempting to assign using attribute style syntax",
      "pr_body": "This should fail noisily rather than silently:\n\n```\nds.foo = 12\n```\n\nFixes #656\nFixes #714\n",
      "issue_id": 714,
      "issue_title": "Setting a Dataset variable with dot notation fails silently",
      "issue_body": "On master:\n\n``` python\nIn [4]: xray.Dataset({'a': xray.DataArray(pd.np.random.rand(10,3))})\nOut[4]: \n<xray.Dataset>\nDimensions:  (dim_0: 10, dim_1: 3)\nCoordinates:\n  * dim_0    (dim_0) int64 0 1 2 3 4 5 6 7 8 9\n  * dim_1    (dim_1) int64 0 1 2\nData variables:\n    a        (dim_0, dim_1) float64 0.2804 0.4567 0.8415 0.1367 0.3122 ...\n\nIn [5]: ds=xray.Dataset({'a': xray.DataArray(pd.np.random.rand(10,3))})\n\nIn [6]: ds.a\nOut[6]: \n<xray.DataArray 'a' (dim_0: 10, dim_1: 3)>\narray([[ 0.19862294,  0.40265588,  0.07676118],\n       [ 0.54722942,  0.47329196,  0.64441943],\n       [ 0.73762014,  0.22396906,  0.9332979 ],\n       [ 0.89731023,  0.71694417,  0.11682691],\n       [ 0.04576582,  0.89288435,  0.87985685],\n       [ 0.57822961,  0.34463642,  0.19137506],\n       [ 0.41551206,  0.50255891,  0.62438694],\n       [ 0.62158645,  0.57294376,  0.39147308],\n       [ 0.83240172,  0.41756554,  0.89859381],\n       [ 0.408273  ,  0.97774586,  0.56584299]])\nCoordinates:\n  * dim_0    (dim_0) int64 0 1 2 3 4 5 6 7 8 9\n  * dim_1    (dim_1) int64 0 1 2\n\nIn [7]: ds.a=10\n\nIn [8]: ds.a\nOut[8]: 10\n\nIn [9]: ds\nOut[9]: \n<xray.Dataset>\nDimensions:  (dim_0: 10, dim_1: 3)\nCoordinates:\n  * dim_0    (dim_0) int64 0 1 2 3 4 5 6 7 8 9\n  * dim_1    (dim_1) int64 0 1 2\nData variables:\n    a        (dim_0, dim_1) float64 0.1986 0.4027 0.07676 0.5472 0.4733 ...\n```\n\nMost confusing when you set `ds.a` to a realistic value, such as `ds.a*2`\n",
      "issue_closed_at": "2016-01-12T18:50:26Z",
      "base_commit": "4be7088013e0b07bcc11e57bccbc9ec4d90c1a01",
      "changes": [
        {
          "file": "xray/core/common.py",
          "type": "function",
          "name": "_get_axis_num",
          "class_name": "AbstractArray",
          "code": "def _get_axis_num(self, dim):\n        try:\n            return self.dims.index(dim)\n        except ValueError:\n            raise ValueError(\"%r not found in array dimensions %r\" %\n                             (dim, self.dims))"
        },
        {
          "file": "xray/core/common.py",
          "type": "function",
          "name": "__getattr__",
          "class_name": "AttrAccessMixin",
          "code": "def __getattr__(self, name):\n        if name != '__setstate__':\n            # this avoids an infinite loop when pickle looks for the\n            # __setstate__ attribute before the xray object is initialized\n            for source in self._attr_sources:\n                with suppress(KeyError):\n                    return source[name]\n        raise AttributeError(\"%r object has no attribute %r\" %\n                             (type(self).__name__, name))"
        },
        {
          "file": "xray/core/dataarray.py",
          "type": "function",
          "name": "__init__",
          "class_name": "DataArray",
          "code": "def __init__(self, data, coords=None, dims=None, name=None,\n                 attrs=None, encoding=None, fastpath=False):\n        \"\"\"\n        Parameters\n        ----------\n        data : array_like\n            Values for this array. Must be an ``numpy.ndarray``, ndarray like,\n            or castable to an ``ndarray``. If a self-described xray or pandas\n            object, attempts are made to use this array's metadata to fill in\n            other unspecified arguments. A view of the array's data is used\n            instead of a copy if possible.\n        coords : sequence or dict of array_like objects, optional\n            Coordinates (tick labels) to use for indexing along each dimension.\n            If dict-like, should be a mapping from dimension names to the\n            corresponding coordinates.\n        dims : str or sequence of str, optional\n            Name(s) of the the data dimension(s). Must be either a string (only\n            for 1D data) or a sequence of strings with length equal to the\n            number of dimensions. If this argument is omitted, dimension names\n            are taken from ``coords`` (if possible) and otherwise default to\n            ``['dim_0', ... 'dim_n']``.\n        name : str or None, optional\n            Name of this array.\n        attrs : dict_like or None, optional\n            Attributes to assign to the new instance. By default, an empty\n            attribute dictionary is initialized.\n        encoding : dict_like or None, optional\n            Dictionary specifying how to encode this array's data into a\n            serialized format like netCDF4. Currently used keys (for netCDF)\n            include '_FillValue', 'scale_factor', 'add_offset', 'dtype',\n            'units' and 'calendar' (the later two only for datetime arrays).\n            Unrecognized keys are ignored.\n        \"\"\"\n        if fastpath:\n            variable = data\n            assert dims is None\n            assert attrs is None\n            assert encoding is None\n        else:\n            # try to fill in arguments from data if they weren't supplied\n            if coords is None:\n                coords = getattr(data, 'coords', None)\n                if isinstance(data, pd.Series):\n                    coords = [data.index]\n                elif isinstance(data, pd.DataFrame):\n                    coords = [data.index, data.columns]\n                elif isinstance(data, (pd.Index, Coordinate)):\n                    coords = [data]\n                elif isinstance(data, pd.Panel):\n                    coords = [data.items, data.major_axis, data.minor_axis]\n            if dims is None:\n                dims = getattr(data, 'dims', getattr(coords, 'dims', None))\n            if name is None:\n                name = getattr(data, 'name', None)\n            if attrs is None:\n                attrs = getattr(data, 'attrs', None)\n            if encoding is None:\n                encoding = getattr(data, 'encoding', None)\n\n            data = as_compatible_data(data)\n            coords, dims = _infer_coords_and_dims(data.shape, coords, dims)\n            variable = Variable(dims, data, attrs, encoding, fastpath=True)\n\n        # These fully describe a DataArray\n        self._variable = variable\n        self._coords = coords\n        self._name = name"
        },
        {
          "file": "xray/core/dataset.py",
          "type": "function",
          "name": "__init__",
          "class_name": "Dataset",
          "code": "def __init__(self, data_vars=None, coords=None, attrs=None,\n                 compat='broadcast_equals', **kwargs):\n        \"\"\"To load data from a file or file-like object, use the `open_dataset`\n        function.\n\n        Parameters\n        ----------\n        data_vars : dict-like, optional\n            A mapping from variable names to :py:class:`~xray.DataArray`\n            objects, :py:class:`~xray.Variable` objects or tuples of the\n            form ``(dims, data[, attrs])`` which can be used as arguments to\n            create a new ``Variable``. Each dimension must have the same length\n            in all variables in which it appears.\n        coords : dict-like, optional\n            Another mapping in the same form as the `variables` argument,\n            except the each item is saved on the dataset as a \"coordinate\".\n            These variables have an associated meaning: they describe\n            constant/fixed/independent quantities, unlike the\n            varying/measured/dependent quantities that belong in `variables`.\n            Coordinates values may be given by 1-dimensional arrays or scalars,\n            in which case `dims` do not need to be supplied: 1D arrays will be\n            assumed to give index values along the dimension with the same\n            name.\n        attrs : dict-like, optional\n            Global attributes to save on this dataset.\n        compat : {'broadcast_equals', 'equals', 'identical'}, optional\n            String indicating how to compare variables of the same name for\n            potential conflicts:\n\n            - 'broadcast_equals': all values must be equal when variables are\n              broadcast against each other to ensure common dimensions.\n            - 'equals': all values and dimensions must be the same.\n            - 'identical': all values, dimensions and attributes must be the\n              same.\n        \"\"\"\n        self._variables = OrderedDict()\n        self._coord_names = set()\n        self._dims = {}\n        self._attrs = None\n        self._file_obj = None\n        if kwargs:\n            if 'variables' in kwargs:\n                data_vars = kwargs.pop('variables')\n                warnings.warn('Variables kwarg is deprecated. Use data_vars', stacklevel=2)\n            if kwargs:\n                raise TypeError('{0} are not valid kwargs'.format(kwargs.keys()))\n        if data_vars is None:\n            data_vars = {}\n        if coords is None:\n            coords = set()\n        if data_vars is not None or coords is not None:\n            self._set_init_vars_and_dims(data_vars, coords, compat)\n        if attrs is not None:\n            self.attrs = attrs"
        },
        {
          "file": "xray/core/dataset.py",
          "type": "function",
          "name": "_construct_direct",
          "class_name": "Dataset",
          "code": "def _construct_direct(cls, variables, coord_names, dims, attrs,\n                          file_obj=None):\n        \"\"\"Shortcut around __init__ for internal use when we want to skip\n        costly validation\n        \"\"\"\n        obj = object.__new__(cls)\n        obj._variables = variables\n        obj._coord_names = coord_names\n        obj._dims = dims\n        obj._attrs = attrs\n        obj._file_obj = file_obj\n        return obj"
        }
      ]
    }
  ]
}