Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account-related emails.

Already on GitHub? Sign in to your account

Optimization for heatmap aggregation with pandas #1174

Merged
merged 3 commits into from Mar 5, 2017
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Jump to
Jump to file
Failed to load files.
Diff view
Diff view
4 changes: 3 additions & 1 deletion holoviews/core/data/__init__.py
Expand Up @@ -518,7 +518,9 @@ def get_dimension_type(self, dim):

def dframe(self, dimensions=None):
"""
Returns the data in the form of a DataFrame.
Returns the data in the form of a DataFrame. Supplying a list
of dimensions filters the dataframe. If the data is already
a DataFrame a copy is returned.
"""
if dimensions:
dimensions = [self.get_dimension(d, strict=True).name for d in dimensions]
Expand Down
12 changes: 12 additions & 0 deletions holoviews/core/data/pandas.py
Expand Up @@ -222,6 +222,18 @@ def add_dimension(cls, columns, dimension, dim_pos, values, vdim):
return data


@classmethod
def as_dframe(cls, dataset):
    """
    Return the given Dataset's data as a pandas DataFrame.

    When the Dataset is already backed by a pandas-based interface,
    the underlying DataFrame is handed back directly, avoiding an
    unnecessary copy; otherwise the data is converted via dframe().
    """
    already_df = issubclass(dataset.interface, PandasInterface)
    return dataset.data if already_df else dataset.dframe()


@classmethod
def dframe(cls, columns, dimensions):
if dimensions:
Expand Down
18 changes: 15 additions & 3 deletions holoviews/element/util.py
Expand Up @@ -5,8 +5,14 @@

from ..core import Dataset, OrderedDict
from ..core.operation import ElementOperation
from ..core.util import (pd, is_nan, sort_topologically,
cartesian_product, is_cyclic, one_to_one)
from ..core.util import (is_nan, sort_topologically, one_to_one,
cartesian_product, is_cyclic)

try:
import pandas as pd
from ..core.data import PandasInterface
except:
pd = None

try:
import dask
Expand Down Expand Up @@ -134,7 +140,13 @@ def _aggregate_dataset(self, obj, xcoords, ycoords):
dtype = 'dataframe' if pd else 'dictionary'
dense_data = Dataset(data, kdims=obj.kdims, vdims=obj.vdims, datatype=[dtype])
concat_data = obj.interface.concatenate([dense_data, obj], datatype=[dtype])
agg = concat_data.reindex([xdim, ydim], vdims).aggregate([xdim, ydim], reduce_fn)
reindexed = concat_data.reindex([xdim, ydim], vdims)
if pd:
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Why not use reindexed.interface.dframe(dimensions=None, copy=False) instead of exposing the copy keyword argument at the element level? For copy=False to work, you are already assuming a dataframe type interface is being used...

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I suppose the other thing you could do is complain if copy=False is passed to the dframe method of any interface that isn't based on dataframes.

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

For copy=False to work, you are already assuming a dataframe type interface is being used...

Because then I need conditional branches for the "is already dataframe" and "convert to dataframe" paths again. I guess I agree copy is confusing because you might assume you can mutate the dataframe and have an effect on the original element if you don't make a copy, when the real point of it is to avoid making pointless copies.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Would there be any harm with the dataframe interfaces just avoiding pointless copies automatically? Then it doesn't have to be something the user needs to ever think about...

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

In my usage of dframe I often create it and then assign to it, so that would be a bit of a pain.

df = PandasInterface.as_dframe(reindexed)
df = df.groupby([xdim, ydim], sort=False).first().reset_index()
agg = reindexed.clone(df)
else:
agg = reindexed.aggregate([xdim, ydim], reduce_fn)

# Convert data to a gridded dataset
grid_data = {xdim: xcoords, ydim: ycoords}
Expand Down
11 changes: 3 additions & 8 deletions holoviews/operation/datashader.py
Expand Up @@ -20,23 +20,19 @@

from ..core import (ElementOperation, Element, Dimension, NdOverlay,
Overlay, CompositeOverlay, Dataset)
from ..core.data import ArrayInterface, PandasInterface, DaskInterface
from ..core.data import PandasInterface, DaskInterface
from ..core.util import get_param_values, basestring
from ..element import GridImage, Image, Path, Curve, Contours, RGB
from ..streams import RangeXY

DF_INTERFACES = [PandasInterface, DaskInterface]

@dispatch(Element)
def discover(dataset):
    """
    Allows datashader to correctly discover the dtypes of the data
    in a holoviews Element.

    Delegates to datashader's discover on the element's underlying
    DataFrame; PandasInterface.as_dframe reuses an existing DataFrame
    without copying when the element is backed by a pandas interface.
    """
    # Fix: the original body referenced the undefined name ``element``
    # instead of the ``dataset`` parameter, raising NameError at call time.
    return dsdiscover(PandasInterface.as_dframe(dataset))


@bypixel.pipeline.register(Element)
Expand Down Expand Up @@ -135,7 +131,6 @@ def get_agg_data(cls, obj, category=None):
kdims = obj.kdims
vdims = obj.vdims
x, y = obj.dimensions(label=True)[:2]
is_df = lambda x: isinstance(x, Dataset) and x.interface in DF_INTERFACES
if isinstance(obj, Path):
glyph = 'line'
for p in obj.data:
Expand All @@ -146,7 +141,7 @@ def get_agg_data(cls, obj, category=None):
elif isinstance(obj, CompositeOverlay):
for key, el in obj.data.items():
x, y, element, glyph = cls.get_agg_data(el)
df = element.data if is_df(element) else element.dframe()
df = PandasInterface.as_dframe(element)
if isinstance(obj, NdOverlay):
df = df.assign(**dict(zip(obj.dimensions('key', True), key)))
paths.append(df)
Expand Down