test_timedelta.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335
  1. from datetime import timedelta
  2. import numpy as np
  3. import pytest
  4. import pandas as pd
  5. from pandas import (
  6. DataFrame, Index, Int64Index, Series, Timedelta, TimedeltaIndex,
  7. date_range, timedelta_range)
  8. import pandas.util.testing as tm
  9. from pandas.util.testing import (
  10. assert_almost_equal, assert_index_equal, assert_series_equal)
  11. from ..datetimelike import DatetimeLike
# Module-level shorthand for NumPy's ``np.random.randn``; used below as the
# cell generator in ``test_does_not_convert_mixed_integer``.
randn = np.random.randn
  13. class TestTimedeltaIndex(DatetimeLike):
  14. _holder = TimedeltaIndex
  15. def setup_method(self, method):
  16. self.indices = dict(index=tm.makeTimedeltaIndex(10))
  17. self.setup_indices()
  18. def create_index(self):
  19. return pd.to_timedelta(range(5), unit='d') + pd.offsets.Hour(1)
  20. def test_numeric_compat(self):
  21. # Dummy method to override super's version; this test is now done
  22. # in test_arithmetic.py
  23. pass
  24. def test_shift(self):
  25. pass # this is handled in test_arithmetic.py
  26. def test_pickle_compat_construction(self):
  27. pass
  28. def test_fillna_timedelta(self):
  29. # GH 11343
  30. idx = pd.TimedeltaIndex(['1 day', pd.NaT, '3 day'])
  31. exp = pd.TimedeltaIndex(['1 day', '2 day', '3 day'])
  32. tm.assert_index_equal(idx.fillna(pd.Timedelta('2 day')), exp)
  33. exp = pd.TimedeltaIndex(['1 day', '3 hour', '3 day'])
  34. idx.fillna(pd.Timedelta('3 hour'))
  35. exp = pd.Index(
  36. [pd.Timedelta('1 day'), 'x', pd.Timedelta('3 day')], dtype=object)
  37. tm.assert_index_equal(idx.fillna('x'), exp)
  38. @pytest.mark.parametrize("sort", [None, False])
  39. def test_difference_freq(self, sort):
  40. # GH14323: Difference of TimedeltaIndex should not preserve frequency
  41. index = timedelta_range("0 days", "5 days", freq="D")
  42. other = timedelta_range("1 days", "4 days", freq="D")
  43. expected = TimedeltaIndex(["0 days", "5 days"], freq=None)
  44. idx_diff = index.difference(other, sort)
  45. tm.assert_index_equal(idx_diff, expected)
  46. tm.assert_attr_equal('freq', idx_diff, expected)
  47. other = timedelta_range("2 days", "5 days", freq="D")
  48. idx_diff = index.difference(other, sort)
  49. expected = TimedeltaIndex(["0 days", "1 days"], freq=None)
  50. tm.assert_index_equal(idx_diff, expected)
  51. tm.assert_attr_equal('freq', idx_diff, expected)
  52. @pytest.mark.parametrize("sort", [None, False])
  53. def test_difference_sort(self, sort):
  54. index = pd.TimedeltaIndex(["5 days", "3 days", "2 days", "4 days",
  55. "1 days", "0 days"])
  56. other = timedelta_range("1 days", "4 days", freq="D")
  57. idx_diff = index.difference(other, sort)
  58. expected = TimedeltaIndex(["5 days", "0 days"], freq=None)
  59. if sort is None:
  60. expected = expected.sort_values()
  61. tm.assert_index_equal(idx_diff, expected)
  62. tm.assert_attr_equal('freq', idx_diff, expected)
  63. other = timedelta_range("2 days", "5 days", freq="D")
  64. idx_diff = index.difference(other, sort)
  65. expected = TimedeltaIndex(["1 days", "0 days"], freq=None)
  66. if sort is None:
  67. expected = expected.sort_values()
  68. tm.assert_index_equal(idx_diff, expected)
  69. tm.assert_attr_equal('freq', idx_diff, expected)
  70. def test_isin(self):
  71. index = tm.makeTimedeltaIndex(4)
  72. result = index.isin(index)
  73. assert result.all()
  74. result = index.isin(list(index))
  75. assert result.all()
  76. assert_almost_equal(index.isin([index[2], 5]),
  77. np.array([False, False, True, False]))
  78. def test_factorize(self):
  79. idx1 = TimedeltaIndex(['1 day', '1 day', '2 day', '2 day', '3 day',
  80. '3 day'])
  81. exp_arr = np.array([0, 0, 1, 1, 2, 2], dtype=np.intp)
  82. exp_idx = TimedeltaIndex(['1 day', '2 day', '3 day'])
  83. arr, idx = idx1.factorize()
  84. tm.assert_numpy_array_equal(arr, exp_arr)
  85. tm.assert_index_equal(idx, exp_idx)
  86. arr, idx = idx1.factorize(sort=True)
  87. tm.assert_numpy_array_equal(arr, exp_arr)
  88. tm.assert_index_equal(idx, exp_idx)
  89. # freq must be preserved
  90. idx3 = timedelta_range('1 day', periods=4, freq='s')
  91. exp_arr = np.array([0, 1, 2, 3], dtype=np.intp)
  92. arr, idx = idx3.factorize()
  93. tm.assert_numpy_array_equal(arr, exp_arr)
  94. tm.assert_index_equal(idx, idx3)
  95. def test_join_self(self, join_type):
  96. index = timedelta_range('1 day', periods=10)
  97. joined = index.join(index, how=join_type)
  98. tm.assert_index_equal(index, joined)
  99. def test_does_not_convert_mixed_integer(self):
  100. df = tm.makeCustomDataframe(10, 10,
  101. data_gen_f=lambda *args, **kwargs: randn(),
  102. r_idx_type='i', c_idx_type='td')
  103. str(df)
  104. cols = df.columns.join(df.index, how='outer')
  105. joined = cols.join(df.columns)
  106. assert cols.dtype == np.dtype('O')
  107. assert cols.dtype == joined.dtype
  108. tm.assert_index_equal(cols, joined)
  109. def test_sort_values(self):
  110. idx = TimedeltaIndex(['4d', '1d', '2d'])
  111. ordered = idx.sort_values()
  112. assert ordered.is_monotonic
  113. ordered = idx.sort_values(ascending=False)
  114. assert ordered[::-1].is_monotonic
  115. ordered, dexer = idx.sort_values(return_indexer=True)
  116. assert ordered.is_monotonic
  117. tm.assert_numpy_array_equal(dexer, np.array([1, 2, 0]),
  118. check_dtype=False)
  119. ordered, dexer = idx.sort_values(return_indexer=True, ascending=False)
  120. assert ordered[::-1].is_monotonic
  121. tm.assert_numpy_array_equal(dexer, np.array([0, 2, 1]),
  122. check_dtype=False)
  123. def test_get_duplicates(self):
  124. idx = TimedeltaIndex(['1 day', '2 day', '2 day', '3 day', '3day',
  125. '4day'])
  126. with tm.assert_produces_warning(FutureWarning):
  127. # Deprecated - see GH20239
  128. result = idx.get_duplicates()
  129. ex = TimedeltaIndex(['2 day', '3day'])
  130. tm.assert_index_equal(result, ex)
  131. def test_argmin_argmax(self):
  132. idx = TimedeltaIndex(['1 day 00:00:05', '1 day 00:00:01',
  133. '1 day 00:00:02'])
  134. assert idx.argmin() == 1
  135. assert idx.argmax() == 0
  136. def test_misc_coverage(self):
  137. rng = timedelta_range('1 day', periods=5)
  138. result = rng.groupby(rng.days)
  139. assert isinstance(list(result.values())[0][0], Timedelta)
  140. idx = TimedeltaIndex(['3d', '1d', '2d'])
  141. assert not idx.equals(list(idx))
  142. non_td = Index(list('abc'))
  143. assert not idx.equals(list(non_td))
  144. def test_map(self):
  145. # test_map_dictlike generally tests
  146. rng = timedelta_range('1 day', periods=10)
  147. f = lambda x: x.days
  148. result = rng.map(f)
  149. exp = Int64Index([f(x) for x in rng])
  150. tm.assert_index_equal(result, exp)
  151. def test_pass_TimedeltaIndex_to_index(self):
  152. rng = timedelta_range('1 days', '10 days')
  153. idx = Index(rng, dtype=object)
  154. expected = Index(rng.to_pytimedelta(), dtype=object)
  155. tm.assert_numpy_array_equal(idx.values, expected.values)
  156. def test_pickle(self):
  157. rng = timedelta_range('1 days', periods=10)
  158. rng_p = tm.round_trip_pickle(rng)
  159. tm.assert_index_equal(rng, rng_p)
  160. def test_hash_error(self):
  161. index = timedelta_range('1 days', periods=10)
  162. with pytest.raises(TypeError, match=("unhashable type: %r" %
  163. type(index).__name__)):
  164. hash(index)
  165. def test_append_join_nondatetimeindex(self):
  166. rng = timedelta_range('1 days', periods=10)
  167. idx = Index(['a', 'b', 'c', 'd'])
  168. result = rng.append(idx)
  169. assert isinstance(result[0], Timedelta)
  170. # it works
  171. rng.join(idx, how='outer')
  172. def test_append_numpy_bug_1681(self):
  173. td = timedelta_range('1 days', '10 days', freq='2D')
  174. a = DataFrame()
  175. c = DataFrame({'A': 'foo', 'B': td}, index=td)
  176. str(c)
  177. result = a.append(c)
  178. assert (result['B'] == td).all()
  179. def test_fields(self):
  180. rng = timedelta_range('1 days, 10:11:12.100123456', periods=2,
  181. freq='s')
  182. tm.assert_index_equal(rng.days, Index([1, 1], dtype='int64'))
  183. tm.assert_index_equal(
  184. rng.seconds,
  185. Index([10 * 3600 + 11 * 60 + 12, 10 * 3600 + 11 * 60 + 13],
  186. dtype='int64'))
  187. tm.assert_index_equal(
  188. rng.microseconds,
  189. Index([100 * 1000 + 123, 100 * 1000 + 123], dtype='int64'))
  190. tm.assert_index_equal(rng.nanoseconds,
  191. Index([456, 456], dtype='int64'))
  192. pytest.raises(AttributeError, lambda: rng.hours)
  193. pytest.raises(AttributeError, lambda: rng.minutes)
  194. pytest.raises(AttributeError, lambda: rng.milliseconds)
  195. # with nat
  196. s = Series(rng)
  197. s[1] = np.nan
  198. tm.assert_series_equal(s.dt.days, Series([1, np.nan], index=[0, 1]))
  199. tm.assert_series_equal(s.dt.seconds, Series(
  200. [10 * 3600 + 11 * 60 + 12, np.nan], index=[0, 1]))
  201. # preserve name (GH15589)
  202. rng.name = 'name'
  203. assert rng.days.name == 'name'
  204. def test_freq_conversion(self):
  205. # doc example
  206. # series
  207. td = Series(date_range('20130101', periods=4)) - \
  208. Series(date_range('20121201', periods=4))
  209. td[2] += timedelta(minutes=5, seconds=3)
  210. td[3] = np.nan
  211. result = td / np.timedelta64(1, 'D')
  212. expected = Series([31, 31, (31 * 86400 + 5 * 60 + 3) / 86400.0, np.nan
  213. ])
  214. assert_series_equal(result, expected)
  215. result = td.astype('timedelta64[D]')
  216. expected = Series([31, 31, 31, np.nan])
  217. assert_series_equal(result, expected)
  218. result = td / np.timedelta64(1, 's')
  219. expected = Series([31 * 86400, 31 * 86400, 31 * 86400 + 5 * 60 + 3,
  220. np.nan])
  221. assert_series_equal(result, expected)
  222. result = td.astype('timedelta64[s]')
  223. assert_series_equal(result, expected)
  224. # tdi
  225. td = TimedeltaIndex(td)
  226. result = td / np.timedelta64(1, 'D')
  227. expected = Index([31, 31, (31 * 86400 + 5 * 60 + 3) / 86400.0, np.nan])
  228. assert_index_equal(result, expected)
  229. result = td.astype('timedelta64[D]')
  230. expected = Index([31, 31, 31, np.nan])
  231. assert_index_equal(result, expected)
  232. result = td / np.timedelta64(1, 's')
  233. expected = Index([31 * 86400, 31 * 86400, 31 * 86400 + 5 * 60 + 3,
  234. np.nan])
  235. assert_index_equal(result, expected)
  236. result = td.astype('timedelta64[s]')
  237. assert_index_equal(result, expected)
  238. class TestTimeSeries(object):
  239. def test_series_box_timedelta(self):
  240. rng = timedelta_range('1 day 1 s', periods=5, freq='h')
  241. s = Series(rng)
  242. assert isinstance(s[1], Timedelta)
  243. assert isinstance(s.iat[2], Timedelta)