Skip to content

Commit 4ea52e6

Browse files
BUG: Fix Series comparison fails when index dtypes differ (object vs string) (pandas-dev#61099)
1 parent b69a2ae commit 4ea52e6

File tree

2 files changed

+39
-0
lines changed

2 files changed

+39
-0
lines changed

pandas/core/indexes/base.py

+9
Original file line numberDiff line numberDiff line change
@@ -5470,6 +5470,15 @@ def equals(self, other: Any) -> bool:
54705470
if len(self) != len(other):
54715471
# quickly return if the lengths are different
54725472
return False
5473+
5474+
if (
5475+
(isinstance(self.dtype, StringDtype)
5476+
or is_object_dtype(self.dtype))
5477+
and
5478+
(isinstance(other.dtype, StringDtype)
5479+
or is_object_dtype(other.dtype))
5480+
):
5481+
return array_equivalent(self.astype("object")._values, other.astype("object")._values)
54735482

54745483
if (
54755484
isinstance(self.dtype, StringDtype)

pandas/tests/indexes/test_base.py

+30
Original file line numberDiff line numberDiff line change
@@ -1717,3 +1717,33 @@ def test_is_monotonic_pyarrow_list_type():
17171717
idx = Index([[1], [2, 3]], dtype=pd.ArrowDtype(pa.list_(pa.int64())))
17181718
assert not idx.is_monotonic_increasing
17191719
assert not idx.is_monotonic_decreasing
1720+
1721+
def test_index_equals_string_vs_object():
1722+
idx1 = pd.Index(['a', 'b', 'c'])
1723+
idx2 = pd.Index(['a', 'b', 'c'], dtype='string')
1724+
assert idx1.equals(idx2)
1725+
assert idx2.equals(idx1)
1726+
1727+
def test_compare_string_vs_object_index_equality():
1728+
s1 = pd.Series([1, 2, 3], index=['a', 'b', 'c']) # dtype=object
1729+
s2 = pd.Series([0, 1, 2], index=pd.Index(['a', 'b', 'c'], dtype='string')) # dtype=string
1730+
1731+
result = s1 > s2
1732+
expected = pd.Series([True, True, True], index=['a', 'b', 'c'])
1733+
pd.testing.assert_series_equal(result, expected)
1734+
1735+
def test_align_string_vs_object_index():
1736+
s1 = pd.Series([1, 2, 3], index=['a', 'b', 'c']) # object
1737+
s2 = pd.Series([1, 2, 3], index=pd.Index(['a', 'b', 'c'], dtype='string')) # string
1738+
1739+
s1_aligned, s2_aligned = s1.align(s2)
1740+
assert list(s1_aligned.index) == list(s2_aligned.index)
1741+
1742+
def test_comparison_without_manual_casting():
1743+
s1 = pd.Series([1, 2, 3], index=['a', 'b', 'c']) # object index
1744+
s2 = pd.Series([1, 2, 3], index=pd.Index(['a', 'b', 'c'], dtype='string'))
1745+
1746+
# Should not raise
1747+
result = s1 == s2
1748+
expected = pd.Series([True, True, True], index=['a', 'b', 'c'])
1749+
pd.testing.assert_series_equal(result, expected)

0 commit comments

Comments
 (0)