123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202 |
- import numpy as np
- import pytest
- from pandas import (
- Index,
- IntervalIndex,
- Timestamp,
- interval_range,
- )
- import pandas._testing as tm
- def monotonic_index(start, end, dtype="int64", closed="right"):
- return IntervalIndex.from_breaks(np.arange(start, end, dtype=dtype), closed=closed)
- def empty_index(dtype="int64", closed="right"):
- return IntervalIndex(np.array([], dtype=dtype), closed=closed)
- class TestIntervalIndex:
- def test_union(self, closed, sort):
- index = monotonic_index(0, 11, closed=closed)
- other = monotonic_index(5, 13, closed=closed)
- expected = monotonic_index(0, 13, closed=closed)
- result = index[::-1].union(other, sort=sort)
- if sort is None:
- tm.assert_index_equal(result, expected)
- assert tm.equalContents(result, expected)
- result = other[::-1].union(index, sort=sort)
- if sort is None:
- tm.assert_index_equal(result, expected)
- assert tm.equalContents(result, expected)
- tm.assert_index_equal(index.union(index, sort=sort), index)
- tm.assert_index_equal(index.union(index[:1], sort=sort), index)
- def test_union_empty_result(self, closed, sort):
- # GH 19101: empty result, same dtype
- index = empty_index(dtype="int64", closed=closed)
- result = index.union(index, sort=sort)
- tm.assert_index_equal(result, index)
- # GH 19101: empty result, different numeric dtypes -> common dtype is f8
- other = empty_index(dtype="float64", closed=closed)
- result = index.union(other, sort=sort)
- expected = other
- tm.assert_index_equal(result, expected)
- other = index.union(index, sort=sort)
- tm.assert_index_equal(result, expected)
- other = empty_index(dtype="uint64", closed=closed)
- result = index.union(other, sort=sort)
- tm.assert_index_equal(result, expected)
- result = other.union(index, sort=sort)
- tm.assert_index_equal(result, expected)
- def test_intersection(self, closed, sort):
- index = monotonic_index(0, 11, closed=closed)
- other = monotonic_index(5, 13, closed=closed)
- expected = monotonic_index(5, 11, closed=closed)
- result = index[::-1].intersection(other, sort=sort)
- if sort is None:
- tm.assert_index_equal(result, expected)
- assert tm.equalContents(result, expected)
- result = other[::-1].intersection(index, sort=sort)
- if sort is None:
- tm.assert_index_equal(result, expected)
- assert tm.equalContents(result, expected)
- tm.assert_index_equal(index.intersection(index, sort=sort), index)
- # GH 26225: nested intervals
- index = IntervalIndex.from_tuples([(1, 2), (1, 3), (1, 4), (0, 2)])
- other = IntervalIndex.from_tuples([(1, 2), (1, 3)])
- expected = IntervalIndex.from_tuples([(1, 2), (1, 3)])
- result = index.intersection(other)
- tm.assert_index_equal(result, expected)
- # GH 26225
- index = IntervalIndex.from_tuples([(0, 3), (0, 2)])
- other = IntervalIndex.from_tuples([(0, 2), (1, 3)])
- expected = IntervalIndex.from_tuples([(0, 2)])
- result = index.intersection(other)
- tm.assert_index_equal(result, expected)
- # GH 26225: duplicate nan element
- index = IntervalIndex([np.nan, np.nan])
- other = IntervalIndex([np.nan])
- expected = IntervalIndex([np.nan])
- result = index.intersection(other)
- tm.assert_index_equal(result, expected)
- def test_intersection_empty_result(self, closed, sort):
- index = monotonic_index(0, 11, closed=closed)
- # GH 19101: empty result, same dtype
- other = monotonic_index(300, 314, closed=closed)
- expected = empty_index(dtype="int64", closed=closed)
- result = index.intersection(other, sort=sort)
- tm.assert_index_equal(result, expected)
- # GH 19101: empty result, different numeric dtypes -> common dtype is float64
- other = monotonic_index(300, 314, dtype="float64", closed=closed)
- result = index.intersection(other, sort=sort)
- expected = other[:0]
- tm.assert_index_equal(result, expected)
- other = monotonic_index(300, 314, dtype="uint64", closed=closed)
- result = index.intersection(other, sort=sort)
- tm.assert_index_equal(result, expected)
- def test_intersection_duplicates(self):
- # GH#38743
- index = IntervalIndex.from_tuples([(1, 2), (1, 2), (2, 3), (3, 4)])
- other = IntervalIndex.from_tuples([(1, 2), (2, 3)])
- expected = IntervalIndex.from_tuples([(1, 2), (2, 3)])
- result = index.intersection(other)
- tm.assert_index_equal(result, expected)
- def test_difference(self, closed, sort):
- index = IntervalIndex.from_arrays([1, 0, 3, 2], [1, 2, 3, 4], closed=closed)
- result = index.difference(index[:1], sort=sort)
- expected = index[1:]
- if sort is None:
- expected = expected.sort_values()
- tm.assert_index_equal(result, expected)
- # GH 19101: empty result, same dtype
- result = index.difference(index, sort=sort)
- expected = empty_index(dtype="int64", closed=closed)
- tm.assert_index_equal(result, expected)
- # GH 19101: empty result, different dtypes
- other = IntervalIndex.from_arrays(
- index.left.astype("float64"), index.right, closed=closed
- )
- result = index.difference(other, sort=sort)
- tm.assert_index_equal(result, expected)
- def test_symmetric_difference(self, closed, sort):
- index = monotonic_index(0, 11, closed=closed)
- result = index[1:].symmetric_difference(index[:-1], sort=sort)
- expected = IntervalIndex([index[0], index[-1]])
- if sort is None:
- tm.assert_index_equal(result, expected)
- assert tm.equalContents(result, expected)
- # GH 19101: empty result, same dtype
- result = index.symmetric_difference(index, sort=sort)
- expected = empty_index(dtype="int64", closed=closed)
- if sort is None:
- tm.assert_index_equal(result, expected)
- assert tm.equalContents(result, expected)
- # GH 19101: empty result, different dtypes
- other = IntervalIndex.from_arrays(
- index.left.astype("float64"), index.right, closed=closed
- )
- result = index.symmetric_difference(other, sort=sort)
- expected = empty_index(dtype="float64", closed=closed)
- tm.assert_index_equal(result, expected)
- @pytest.mark.filterwarnings("ignore:'<' not supported between:RuntimeWarning")
- @pytest.mark.parametrize(
- "op_name", ["union", "intersection", "difference", "symmetric_difference"]
- )
- def test_set_incompatible_types(self, closed, op_name, sort):
- index = monotonic_index(0, 11, closed=closed)
- set_op = getattr(index, op_name)
- # TODO: standardize return type of non-union setops type(self vs other)
- # non-IntervalIndex
- if op_name == "difference":
- expected = index
- else:
- expected = getattr(index.astype("O"), op_name)(Index([1, 2, 3]))
- result = set_op(Index([1, 2, 3]), sort=sort)
- tm.assert_index_equal(result, expected)
- # mixed closed -> cast to object
- for other_closed in {"right", "left", "both", "neither"} - {closed}:
- other = monotonic_index(0, 11, closed=other_closed)
- expected = getattr(index.astype(object), op_name)(other, sort=sort)
- if op_name == "difference":
- expected = index
- result = set_op(other, sort=sort)
- tm.assert_index_equal(result, expected)
- # GH 19016: incompatible dtypes -> cast to object
- other = interval_range(Timestamp("20180101"), periods=9, closed=closed)
- expected = getattr(index.astype(object), op_name)(other, sort=sort)
- if op_name == "difference":
- expected = index
- result = set_op(other, sort=sort)
- tm.assert_index_equal(result, expected)
|