Why Gemfury? Push, build, and install  RubyGems npm packages Python packages Maven artifacts PHP packages Go Modules Debian packages RPM packages NuGet packages

Repository URL to install this package:

Details    
pandas / tests / sparse / test_groupby.py
Size: Mime:
# -*- coding: utf-8 -*-
import numpy as np
import pandas as pd
import pandas.util.testing as tm


class TestSparseGroupBy(object):

    def setup_method(self, method):
        self.dense = pd.DataFrame({'A': ['foo', 'bar', 'foo', 'bar',
                                         'foo', 'bar', 'foo', 'foo'],
                                   'B': ['one', 'one', 'two', 'three',
                                         'two', 'two', 'one', 'three'],
                                   'C': np.random.randn(8),
                                   'D': np.random.randn(8),
                                   'E': [np.nan, np.nan, 1, 2,
                                         np.nan, 1, np.nan, np.nan]})
        self.sparse = self.dense.to_sparse()

    def test_first_last_nth(self):
        # tests for first / last / nth
        sparse_grouped = self.sparse.groupby('A')
        dense_grouped = self.dense.groupby('A')

        tm.assert_frame_equal(sparse_grouped.first(),
                              dense_grouped.first())
        tm.assert_frame_equal(sparse_grouped.last(),
                              dense_grouped.last())
        tm.assert_frame_equal(sparse_grouped.nth(1),
                              dense_grouped.nth(1))

    def test_aggfuncs(self):
        sparse_grouped = self.sparse.groupby('A')
        dense_grouped = self.dense.groupby('A')

        tm.assert_frame_equal(sparse_grouped.mean(),
                              dense_grouped.mean())

        # ToDo: sparse sum includes str column
        # tm.assert_frame_equal(sparse_grouped.sum(),
        #                       dense_grouped.sum())

        tm.assert_frame_equal(sparse_grouped.count(),
                              dense_grouped.count())