eland/tests/series/test_value_counts_pytest.py
2020-11-16 11:30:41 -06:00

78 lines
2.7 KiB
Python

# Licensed to Elasticsearch B.V. under one or more contributor
# license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright
# ownership. Elasticsearch B.V. licenses this file to you under
# the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
# File called _pytest for PyCharm compatability
import pytest
from pandas.testing import assert_series_equal
from tests.common import TestData
class TestSeriesValueCounts(TestData):
def test_value_counts(self):
pd_s = self.pd_flights()["Carrier"]
ed_s = self.ed_flights()["Carrier"]
pd_vc = pd_s.value_counts()
ed_vc = ed_s.value_counts()
assert_series_equal(pd_vc, ed_vc)
def test_value_counts_size(self):
pd_s = self.pd_flights()["Carrier"]
ed_s = self.ed_flights()["Carrier"]
pd_vc = pd_s.value_counts()[:1]
ed_vc = ed_s.value_counts(es_size=1)
assert_series_equal(pd_vc, ed_vc)
def test_value_counts_keyerror(self):
ed_f = self.ed_flights()
with pytest.raises(KeyError):
assert ed_f["not_a_column"].value_counts()
def test_value_counts_dataframe(self):
# value_counts() is a series method, should raise AttributeError if called on a DataFrame
ed_f = self.ed_flights()
with pytest.raises(AttributeError):
assert ed_f.value_counts()
def test_value_counts_non_int(self):
ed_s = self.ed_flights()["Carrier"]
with pytest.raises(TypeError):
assert ed_s.value_counts(es_size="foo")
def test_value_counts_non_positive_int(self):
ed_s = self.ed_flights()["Carrier"]
with pytest.raises(ValueError):
assert ed_s.value_counts(es_size=-9)
@pytest.mark.filterwarnings("ignore:Aggregations not supported")
def test_value_counts_non_aggregatable(self):
ed_s = self.ed_ecommerce()["customer_first_name"]
pd_s = self.pd_ecommerce()["customer_first_name"]
pd_vc = pd_s.value_counts().head(20).sort_index()
ed_vc = ed_s.value_counts(es_size=20).sort_index()
assert_series_equal(pd_vc, ed_vc)
ed_s = self.ed_ecommerce()["customer_gender"]
with pytest.raises(ValueError):
assert ed_s.value_counts()