mirror of
https://github.com/aykhans/AzSuicideDataVisualization.git
synced 2025-07-02 06:22:25 +00:00
first commit
This commit is contained in:
210
.venv/Lib/site-packages/pandas/tests/extension/test_string.py
Normal file
210
.venv/Lib/site-packages/pandas/tests/extension/test_string.py
Normal file
@ -0,0 +1,210 @@
|
||||
"""
|
||||
This file contains a minimal set of tests for compliance with the extension
|
||||
array interface test suite, and should contain no other tests.
|
||||
The test suite for the full functionality of the array is located in
|
||||
`pandas/tests/arrays/`.
|
||||
|
||||
The tests in this file are inherited from the BaseExtensionTests, and only
|
||||
minimal tweaks should be applied to get the tests passing (by overwriting a
|
||||
parent method).
|
||||
|
||||
Additional tests should either be added to one of the BaseExtensionTests
|
||||
classes (if they are relevant for the extension interface for all dtypes), or
|
||||
be added to the array-specific tests in `pandas/tests/arrays/`.
|
||||
|
||||
"""
|
||||
import string
|
||||
|
||||
import numpy as np
|
||||
import pytest
|
||||
|
||||
from pandas.compat import pa_version_under2p0
|
||||
|
||||
import pandas as pd
|
||||
from pandas.core.arrays import ArrowStringArray
|
||||
from pandas.core.arrays.string_ import StringDtype
|
||||
from pandas.tests.extension import base
|
||||
|
||||
|
||||
def split_array(arr):
|
||||
if arr.dtype.storage != "pyarrow":
|
||||
pytest.skip("only applicable for pyarrow chunked array n/a")
|
||||
|
||||
def _split_array(arr):
|
||||
import pyarrow as pa
|
||||
|
||||
arrow_array = arr._data
|
||||
split = len(arrow_array) // 2
|
||||
arrow_array = pa.chunked_array(
|
||||
[*arrow_array[:split].chunks, *arrow_array[split:].chunks]
|
||||
)
|
||||
assert arrow_array.num_chunks == 2
|
||||
return type(arr)(arrow_array)
|
||||
|
||||
return _split_array(arr)
|
||||
|
||||
|
||||
@pytest.fixture(params=[True, False])
|
||||
def chunked(request):
|
||||
return request.param
|
||||
|
||||
|
||||
@pytest.fixture
|
||||
def dtype(string_storage):
|
||||
return StringDtype(storage=string_storage)
|
||||
|
||||
|
||||
@pytest.fixture
|
||||
def data(dtype, chunked):
|
||||
strings = np.random.choice(list(string.ascii_letters), size=100)
|
||||
while strings[0] == strings[1]:
|
||||
strings = np.random.choice(list(string.ascii_letters), size=100)
|
||||
|
||||
arr = dtype.construct_array_type()._from_sequence(strings)
|
||||
return split_array(arr) if chunked else arr
|
||||
|
||||
|
||||
@pytest.fixture
|
||||
def data_missing(dtype, chunked):
|
||||
"""Length 2 array with [NA, Valid]"""
|
||||
arr = dtype.construct_array_type()._from_sequence([pd.NA, "A"])
|
||||
return split_array(arr) if chunked else arr
|
||||
|
||||
|
||||
@pytest.fixture
|
||||
def data_for_sorting(dtype, chunked):
|
||||
arr = dtype.construct_array_type()._from_sequence(["B", "C", "A"])
|
||||
return split_array(arr) if chunked else arr
|
||||
|
||||
|
||||
@pytest.fixture
|
||||
def data_missing_for_sorting(dtype, chunked):
|
||||
arr = dtype.construct_array_type()._from_sequence(["B", pd.NA, "A"])
|
||||
return split_array(arr) if chunked else arr
|
||||
|
||||
|
||||
@pytest.fixture
|
||||
def na_value():
|
||||
return pd.NA
|
||||
|
||||
|
||||
@pytest.fixture
|
||||
def data_for_grouping(dtype, chunked):
|
||||
arr = dtype.construct_array_type()._from_sequence(
|
||||
["B", "B", pd.NA, pd.NA, "A", "A", "B", "C"]
|
||||
)
|
||||
return split_array(arr) if chunked else arr
|
||||
|
||||
|
||||
class TestDtype(base.BaseDtypeTests):
|
||||
def test_eq_with_str(self, dtype):
|
||||
assert dtype == f"string[{dtype.storage}]"
|
||||
super().test_eq_with_str(dtype)
|
||||
|
||||
|
||||
class TestInterface(base.BaseInterfaceTests):
|
||||
def test_view(self, data, request):
|
||||
if data.dtype.storage == "pyarrow":
|
||||
mark = pytest.mark.xfail(reason="not implemented")
|
||||
request.node.add_marker(mark)
|
||||
super().test_view(data)
|
||||
|
||||
|
||||
class TestConstructors(base.BaseConstructorsTests):
|
||||
def test_from_dtype(self, data):
|
||||
# base test uses string representation of dtype
|
||||
pass
|
||||
|
||||
|
||||
class TestReshaping(base.BaseReshapingTests):
|
||||
def test_transpose(self, data, request):
|
||||
if data.dtype.storage == "pyarrow":
|
||||
mark = pytest.mark.xfail(reason="not implemented")
|
||||
request.node.add_marker(mark)
|
||||
super().test_transpose(data)
|
||||
|
||||
|
||||
class TestGetitem(base.BaseGetitemTests):
|
||||
pass
|
||||
|
||||
|
||||
class TestSetitem(base.BaseSetitemTests):
|
||||
def test_setitem_preserves_views(self, data, request):
|
||||
if data.dtype.storage == "pyarrow":
|
||||
mark = pytest.mark.xfail(reason="not implemented")
|
||||
request.node.add_marker(mark)
|
||||
super().test_setitem_preserves_views(data)
|
||||
|
||||
|
||||
class TestIndex(base.BaseIndexTests):
|
||||
pass
|
||||
|
||||
|
||||
class TestMissing(base.BaseMissingTests):
|
||||
pass
|
||||
|
||||
|
||||
class TestNoReduce(base.BaseNoReduceTests):
|
||||
@pytest.mark.parametrize("skipna", [True, False])
|
||||
def test_reduce_series_numeric(self, data, all_numeric_reductions, skipna):
|
||||
op_name = all_numeric_reductions
|
||||
|
||||
if op_name in ["min", "max"]:
|
||||
return None
|
||||
|
||||
ser = pd.Series(data)
|
||||
with pytest.raises(TypeError):
|
||||
getattr(ser, op_name)(skipna=skipna)
|
||||
|
||||
|
||||
class TestMethods(base.BaseMethodsTests):
|
||||
@pytest.mark.skip(reason="returns nullable")
|
||||
def test_value_counts(self, all_data, dropna):
|
||||
return super().test_value_counts(all_data, dropna)
|
||||
|
||||
@pytest.mark.xfail(reason="returns nullable: GH 44692")
|
||||
def test_value_counts_with_normalize(self, data):
|
||||
super().test_value_counts_with_normalize(data)
|
||||
|
||||
|
||||
class TestCasting(base.BaseCastingTests):
|
||||
pass
|
||||
|
||||
|
||||
class TestComparisonOps(base.BaseComparisonOpsTests):
|
||||
def _compare_other(self, ser, data, op, other):
|
||||
op_name = f"__{op.__name__}__"
|
||||
result = getattr(ser, op_name)(other)
|
||||
expected = getattr(ser.astype(object), op_name)(other).astype("boolean")
|
||||
self.assert_series_equal(result, expected)
|
||||
|
||||
def test_compare_scalar(self, data, comparison_op):
|
||||
ser = pd.Series(data)
|
||||
self._compare_other(ser, data, comparison_op, "abc")
|
||||
|
||||
|
||||
class TestParsing(base.BaseParsingTests):
|
||||
pass
|
||||
|
||||
|
||||
class TestPrinting(base.BasePrintingTests):
|
||||
pass
|
||||
|
||||
|
||||
class TestGroupBy(base.BaseGroupbyTests):
|
||||
def test_groupby_extension_transform(self, data_for_grouping, request):
|
||||
if data_for_grouping.dtype.storage == "pyarrow" and pa_version_under2p0:
|
||||
# failure observed in 1.0.1, not in 2.0 or later
|
||||
mark = pytest.mark.xfail(reason="pyarrow raises in self._data[item]")
|
||||
request.node.add_marker(mark)
|
||||
super().test_groupby_extension_transform(data_for_grouping)
|
||||
|
||||
|
||||
class Test2DCompat(base.Dim2CompatTests):
|
||||
@pytest.fixture(autouse=True)
|
||||
def arrow_not_supported(self, data, request):
|
||||
if isinstance(data, ArrowStringArray):
|
||||
mark = pytest.mark.xfail(
|
||||
reason="2D support not implemented for ArrowStringArray"
|
||||
)
|
||||
request.node.add_marker(mark)
|
Reference in New Issue
Block a user