PageRenderTime 57ms CodeModel.GetById 26ms RepoModel.GetById 0ms app.codeStats 0ms

/pandas/tseries/tests/test_tslib.py

https://github.com/ajcr/pandas
Python | 447 lines | 335 code | 78 blank | 34 comment | 22 complexity | 8eb74e6b721ebbaa37a7cacf9713e66d MD5 | raw file
Possible License(s): BSD-3-Clause, Apache-2.0
  1. import nose
  2. import numpy as np
  3. from pandas import tslib
  4. import datetime
  5. from pandas.core.api import Timestamp, Series
  6. from pandas.tslib import period_asfreq, period_ordinal
  7. from pandas.tseries.index import date_range
  8. from pandas.tseries.frequencies import get_freq
  9. import pandas.tseries.offsets as offsets
  10. from pandas import _np_version_under1p7
  11. import pandas.util.testing as tm
  12. from pandas.util.testing import assert_series_equal
  13. class TestTimestamp(tm.TestCase):
  14. def test_repr(self):
  15. date = '2014-03-07'
  16. tz = 'US/Eastern'
  17. freq = 'M'
  18. date_only = Timestamp(date)
  19. self.assertIn(date, repr(date_only))
  20. self.assertNotIn(tz, repr(date_only))
  21. self.assertNotIn(freq, repr(date_only))
  22. self.assertEqual(date_only, eval(repr(date_only)))
  23. date_tz = Timestamp(date, tz=tz)
  24. self.assertIn(date, repr(date_tz))
  25. self.assertIn(tz, repr(date_tz))
  26. self.assertNotIn(freq, repr(date_tz))
  27. self.assertEqual(date_tz, eval(repr(date_tz)))
  28. date_freq = Timestamp(date, offset=freq)
  29. self.assertIn(date, repr(date_freq))
  30. self.assertNotIn(tz, repr(date_freq))
  31. self.assertIn(freq, repr(date_freq))
  32. self.assertEqual(date_freq, eval(repr(date_freq)))
  33. date_tz_freq = Timestamp(date, tz=tz, offset=freq)
  34. self.assertIn(date, repr(date_tz_freq))
  35. self.assertIn(tz, repr(date_tz_freq))
  36. self.assertIn(freq, repr(date_tz_freq))
  37. self.assertEqual(date_tz_freq, eval(repr(date_tz_freq)))
  38. # this can cause the tz field to be populated, but it's redundant to information in the datestring
  39. date_with_utc_offset = Timestamp('2014-03-13 00:00:00-0400', tz=None)
  40. self.assertIn('2014-03-13 00:00:00-0400', repr(date_with_utc_offset))
  41. self.assertNotIn('tzoffset', repr(date_with_utc_offset))
  42. self.assertEqual(date_with_utc_offset, eval(repr(date_with_utc_offset)))
  43. def test_bounds_with_different_units(self):
  44. out_of_bounds_dates = (
  45. '1677-09-21',
  46. '2262-04-12',
  47. )
  48. time_units = ('D', 'h', 'm', 's', 'ms', 'us')
  49. for date_string in out_of_bounds_dates:
  50. for unit in time_units:
  51. self.assertRaises(
  52. ValueError,
  53. Timestamp,
  54. np.datetime64(date_string, dtype='M8[%s]' % unit)
  55. )
  56. in_bounds_dates = (
  57. '1677-09-23',
  58. '2262-04-11',
  59. )
  60. for date_string in in_bounds_dates:
  61. for unit in time_units:
  62. Timestamp(
  63. np.datetime64(date_string, dtype='M8[%s]' % unit)
  64. )
  65. def test_tz(self):
  66. t = '2014-02-01 09:00'
  67. ts = Timestamp(t)
  68. local = ts.tz_localize('Asia/Tokyo')
  69. self.assertEqual(local.hour, 9)
  70. self.assertEqual(local, Timestamp(t, tz='Asia/Tokyo'))
  71. conv = local.tz_convert('US/Eastern')
  72. self.assertEqual(conv,
  73. Timestamp('2014-01-31 19:00', tz='US/Eastern'))
  74. self.assertEqual(conv.hour, 19)
  75. # preserves nanosecond
  76. ts = Timestamp(t) + offsets.Nano(5)
  77. local = ts.tz_localize('Asia/Tokyo')
  78. self.assertEqual(local.hour, 9)
  79. self.assertEqual(local.nanosecond, 5)
  80. conv = local.tz_convert('US/Eastern')
  81. self.assertEqual(conv.nanosecond, 5)
  82. self.assertEqual(conv.hour, 19)
  83. def test_barely_oob_dts(self):
  84. one_us = np.timedelta64(1)
  85. # By definition we can't go out of bounds in [ns], so we
  86. # convert the datetime64s to [us] so we can go out of bounds
  87. min_ts_us = np.datetime64(Timestamp.min).astype('M8[us]')
  88. max_ts_us = np.datetime64(Timestamp.max).astype('M8[us]')
  89. # No error for the min/max datetimes
  90. Timestamp(min_ts_us)
  91. Timestamp(max_ts_us)
  92. # One us less than the minimum is an error
  93. self.assertRaises(ValueError, Timestamp, min_ts_us - one_us)
  94. # One us more than the maximum is an error
  95. self.assertRaises(ValueError, Timestamp, max_ts_us + one_us)
  96. class TestDatetimeParsingWrappers(tm.TestCase):
  97. def test_does_not_convert_mixed_integer(self):
  98. bad_date_strings = (
  99. '-50000',
  100. '999',
  101. '123.1234',
  102. 'm',
  103. 'T'
  104. )
  105. for bad_date_string in bad_date_strings:
  106. self.assertFalse(
  107. tslib._does_string_look_like_datetime(bad_date_string)
  108. )
  109. good_date_strings = (
  110. '2012-01-01',
  111. '01/01/2012',
  112. 'Mon Sep 16, 2013',
  113. '01012012',
  114. '0101',
  115. '1-1',
  116. )
  117. for good_date_string in good_date_strings:
  118. self.assertTrue(
  119. tslib._does_string_look_like_datetime(good_date_string)
  120. )
  121. class TestArrayToDatetime(tm.TestCase):
  122. def test_parsing_valid_dates(self):
  123. arr = np.array(['01-01-2013', '01-02-2013'], dtype=object)
  124. self.assert_numpy_array_equal(
  125. tslib.array_to_datetime(arr),
  126. np.array(
  127. [
  128. '2013-01-01T00:00:00.000000000-0000',
  129. '2013-01-02T00:00:00.000000000-0000'
  130. ],
  131. dtype='M8[ns]'
  132. )
  133. )
  134. arr = np.array(['Mon Sep 16 2013', 'Tue Sep 17 2013'], dtype=object)
  135. self.assert_numpy_array_equal(
  136. tslib.array_to_datetime(arr),
  137. np.array(
  138. [
  139. '2013-09-16T00:00:00.000000000-0000',
  140. '2013-09-17T00:00:00.000000000-0000'
  141. ],
  142. dtype='M8[ns]'
  143. )
  144. )
  145. def test_number_looking_strings_not_into_datetime(self):
  146. # #4601
  147. # These strings don't look like datetimes so they shouldn't be
  148. # attempted to be converted
  149. arr = np.array(['-352.737091', '183.575577'], dtype=object)
  150. self.assert_numpy_array_equal(tslib.array_to_datetime(arr), arr)
  151. arr = np.array(['1', '2', '3', '4', '5'], dtype=object)
  152. self.assert_numpy_array_equal(tslib.array_to_datetime(arr), arr)
  153. def test_coercing_dates_outside_of_datetime64_ns_bounds(self):
  154. invalid_dates = [
  155. datetime.date(1000, 1, 1),
  156. datetime.datetime(1000, 1, 1),
  157. '1000-01-01',
  158. 'Jan 1, 1000',
  159. np.datetime64('1000-01-01'),
  160. ]
  161. for invalid_date in invalid_dates:
  162. self.assertRaises(
  163. ValueError,
  164. tslib.array_to_datetime,
  165. np.array([invalid_date], dtype='object'),
  166. coerce=False,
  167. raise_=True,
  168. )
  169. self.assertTrue(
  170. np.array_equal(
  171. tslib.array_to_datetime(
  172. np.array([invalid_date], dtype='object'), coerce=True
  173. ),
  174. np.array([tslib.iNaT], dtype='M8[ns]')
  175. )
  176. )
  177. arr = np.array(['1/1/1000', '1/1/2000'], dtype=object)
  178. self.assert_numpy_array_equal(
  179. tslib.array_to_datetime(arr, coerce=True),
  180. np.array(
  181. [
  182. tslib.iNaT,
  183. '2000-01-01T00:00:00.000000000-0000'
  184. ],
  185. dtype='M8[ns]'
  186. )
  187. )
  188. def test_coerce_of_invalid_datetimes(self):
  189. arr = np.array(['01-01-2013', 'not_a_date', '1'], dtype=object)
  190. # Without coercing, the presence of any invalid dates prevents
  191. # any values from being converted
  192. self.assert_numpy_array_equal(tslib.array_to_datetime(arr), arr)
  193. # With coercing, the invalid dates becomes iNaT
  194. self.assert_numpy_array_equal(
  195. tslib.array_to_datetime(arr, coerce=True),
  196. np.array(
  197. [
  198. '2013-01-01T00:00:00.000000000-0000',
  199. tslib.iNaT,
  200. tslib.iNaT
  201. ],
  202. dtype='M8[ns]'
  203. )
  204. )
  205. def test_parsing_timezone_offsets(self):
  206. # All of these datetime strings with offsets are equivalent
  207. # to the same datetime after the timezone offset is added
  208. dt_strings = [
  209. '01-01-2013 08:00:00+08:00',
  210. '2013-01-01T08:00:00.000000000+0800',
  211. '2012-12-31T16:00:00.000000000-0800',
  212. '12-31-2012 23:00:00-01:00',
  213. ]
  214. expected_output = tslib.array_to_datetime(
  215. np.array(['01-01-2013 00:00:00'], dtype=object)
  216. )
  217. for dt_string in dt_strings:
  218. self.assert_numpy_array_equal(
  219. tslib.array_to_datetime(
  220. np.array([dt_string], dtype=object)
  221. ),
  222. expected_output
  223. )
  224. class TestTimestampNsOperations(tm.TestCase):
  225. def setUp(self):
  226. if _np_version_under1p7:
  227. raise nose.SkipTest('numpy >= 1.7 required')
  228. self.timestamp = Timestamp(datetime.datetime.utcnow())
  229. def assert_ns_timedelta(self, modified_timestamp, expected_value):
  230. value = self.timestamp.value
  231. modified_value = modified_timestamp.value
  232. self.assertEqual(modified_value - value, expected_value)
  233. def test_timedelta_ns_arithmetic(self):
  234. self.assert_ns_timedelta(self.timestamp + np.timedelta64(-123, 'ns'), -123)
  235. def test_timedelta_ns_based_arithmetic(self):
  236. self.assert_ns_timedelta(self.timestamp + np.timedelta64(1234567898, 'ns'), 1234567898)
  237. def test_timedelta_us_arithmetic(self):
  238. self.assert_ns_timedelta(self.timestamp + np.timedelta64(-123, 'us'), -123000)
  239. def test_timedelta_ns_arithmetic(self):
  240. time = self.timestamp + np.timedelta64(-123, 'ms')
  241. self.assert_ns_timedelta(time, -123000000)
  242. def test_nanosecond_string_parsing(self):
  243. self.timestamp = Timestamp('2013-05-01 07:15:45.123456789')
  244. self.assertEqual(self.timestamp.value, 1367392545123456000)
  245. def test_nat_arithmetic(self):
  246. # GH 6873
  247. nat = tslib.NaT
  248. t = Timestamp('2014-01-01')
  249. dt = datetime.datetime(2014, 1, 1)
  250. delta = datetime.timedelta(3600)
  251. # Timestamp / datetime
  252. for (left, right) in [(nat, nat), (nat, t), (dt, nat)]:
  253. # NaT + Timestamp-like should raise TypeError
  254. with tm.assertRaises(TypeError):
  255. left + right
  256. with tm.assertRaises(TypeError):
  257. right + left
  258. # NaT - Timestamp-like (or inverse) returns NaT
  259. self.assertTrue((left - right) is tslib.NaT)
  260. self.assertTrue((right - left) is tslib.NaT)
  261. # timedelta-like
  262. # offsets are tested in test_offsets.py
  263. for (left, right) in [(nat, delta)]:
  264. # NaT + timedelta-like returns NaT
  265. self.assertTrue((left + right) is tslib.NaT)
  266. # timedelta-like + NaT should raise TypeError
  267. with tm.assertRaises(TypeError):
  268. right + left
  269. self.assertTrue((left - right) is tslib.NaT)
  270. with tm.assertRaises(TypeError):
  271. right - left
  272. if _np_version_under1p7:
  273. self.assertEqual(nat + np.timedelta64(1, 'h'), tslib.NaT)
  274. with tm.assertRaises(TypeError):
  275. np.timedelta64(1, 'h') + nat
  276. self.assertEqual(nat - np.timedelta64(1, 'h'), tslib.NaT)
  277. with tm.assertRaises(TypeError):
  278. np.timedelta64(1, 'h') - nat
  279. class TestTslib(tm.TestCase):
  280. def test_intraday_conversion_factors(self):
  281. self.assertEqual(period_asfreq(1, get_freq('D'), get_freq('H'), False), 24)
  282. self.assertEqual(period_asfreq(1, get_freq('D'), get_freq('T'), False), 1440)
  283. self.assertEqual(period_asfreq(1, get_freq('D'), get_freq('S'), False), 86400)
  284. self.assertEqual(period_asfreq(1, get_freq('D'), get_freq('L'), False), 86400000)
  285. self.assertEqual(period_asfreq(1, get_freq('D'), get_freq('U'), False), 86400000000)
  286. self.assertEqual(period_asfreq(1, get_freq('D'), get_freq('N'), False), 86400000000000)
  287. self.assertEqual(period_asfreq(1, get_freq('H'), get_freq('T'), False), 60)
  288. self.assertEqual(period_asfreq(1, get_freq('H'), get_freq('S'), False), 3600)
  289. self.assertEqual(period_asfreq(1, get_freq('H'), get_freq('L'), False), 3600000)
  290. self.assertEqual(period_asfreq(1, get_freq('H'), get_freq('U'), False), 3600000000)
  291. self.assertEqual(period_asfreq(1, get_freq('H'), get_freq('N'), False), 3600000000000)
  292. self.assertEqual(period_asfreq(1, get_freq('T'), get_freq('S'), False), 60)
  293. self.assertEqual(period_asfreq(1, get_freq('T'), get_freq('L'), False), 60000)
  294. self.assertEqual(period_asfreq(1, get_freq('T'), get_freq('U'), False), 60000000)
  295. self.assertEqual(period_asfreq(1, get_freq('T'), get_freq('N'), False), 60000000000)
  296. self.assertEqual(period_asfreq(1, get_freq('S'), get_freq('L'), False), 1000)
  297. self.assertEqual(period_asfreq(1, get_freq('S'), get_freq('U'), False), 1000000)
  298. self.assertEqual(period_asfreq(1, get_freq('S'), get_freq('N'), False), 1000000000)
  299. self.assertEqual(period_asfreq(1, get_freq('L'), get_freq('U'), False), 1000)
  300. self.assertEqual(period_asfreq(1, get_freq('L'), get_freq('N'), False), 1000000)
  301. self.assertEqual(period_asfreq(1, get_freq('U'), get_freq('N'), False), 1000)
  302. def test_period_ordinal_start_values(self):
  303. # information for 1.1.1970
  304. self.assertEqual(0, period_ordinal(1970, 1, 1, 0, 0, 0, 0, 0, get_freq('Y')))
  305. self.assertEqual(0, period_ordinal(1970, 1, 1, 0, 0, 0, 0, 0, get_freq('M')))
  306. self.assertEqual(1, period_ordinal(1970, 1, 1, 0, 0, 0, 0, 0, get_freq('W')))
  307. self.assertEqual(0, period_ordinal(1970, 1, 1, 0, 0, 0, 0, 0, get_freq('D')))
  308. self.assertEqual(0, period_ordinal(1970, 1, 1, 0, 0, 0, 0, 0, get_freq('B')))
  309. def test_period_ordinal_week(self):
  310. self.assertEqual(1, period_ordinal(1970, 1, 4, 0, 0, 0, 0, 0, get_freq('W')))
  311. self.assertEqual(2, period_ordinal(1970, 1, 5, 0, 0, 0, 0, 0, get_freq('W')))
  312. self.assertEqual(2284, period_ordinal(2013, 10, 6, 0, 0, 0, 0, 0, get_freq('W')))
  313. self.assertEqual(2285, period_ordinal(2013, 10, 7, 0, 0, 0, 0, 0, get_freq('W')))
  314. def test_period_ordinal_business_day(self):
  315. # Thursday
  316. self.assertEqual(11415, period_ordinal(2013, 10, 3, 0, 0, 0, 0, 0, get_freq('B')))
  317. # Friday
  318. self.assertEqual(11416, period_ordinal(2013, 10, 4, 0, 0, 0, 0, 0, get_freq('B')))
  319. # Saturday
  320. self.assertEqual(11417, period_ordinal(2013, 10, 5, 0, 0, 0, 0, 0, get_freq('B')))
  321. # Sunday
  322. self.assertEqual(11417, period_ordinal(2013, 10, 6, 0, 0, 0, 0, 0, get_freq('B')))
  323. # Monday
  324. self.assertEqual(11417, period_ordinal(2013, 10, 7, 0, 0, 0, 0, 0, get_freq('B')))
  325. # Tuesday
  326. self.assertEqual(11418, period_ordinal(2013, 10, 8, 0, 0, 0, 0, 0, get_freq('B')))
  327. class TestTimestampOps(tm.TestCase):
  328. def test_timestamp_and_datetime(self):
  329. self.assertEqual((Timestamp(datetime.datetime(2013, 10, 13)) - datetime.datetime(2013, 10, 12)).days, 1)
  330. self.assertEqual((datetime.datetime(2013, 10, 12) - Timestamp(datetime.datetime(2013, 10, 13))).days, -1)
  331. def test_timestamp_and_series(self):
  332. timestamp_series = Series(date_range('2014-03-17', periods=2, freq='D', tz='US/Eastern'))
  333. first_timestamp = timestamp_series[0]
  334. if not _np_version_under1p7:
  335. delta_series = Series([np.timedelta64(0, 'D'), np.timedelta64(1, 'D')])
  336. assert_series_equal(timestamp_series - first_timestamp, delta_series)
  337. assert_series_equal(first_timestamp - timestamp_series, -delta_series)
  338. def test_addition_subtraction_types(self):
  339. # Assert on the types resulting from Timestamp +/- various date/time objects
  340. datetime_instance = datetime.datetime(2014, 3, 4)
  341. timedelta_instance = datetime.timedelta(seconds=1)
  342. # build a timestamp with a frequency, since then it supports addition/subtraction of integers
  343. timestamp_instance = date_range(datetime_instance, periods=1, freq='D')[0]
  344. self.assertEqual(type(timestamp_instance + 1), Timestamp)
  345. self.assertEqual(type(timestamp_instance - 1), Timestamp)
  346. # Timestamp + datetime not supported, though subtraction is supported and yields timedelta
  347. self.assertEqual(type(timestamp_instance - datetime_instance), datetime.timedelta)
  348. self.assertEqual(type(timestamp_instance + timedelta_instance), Timestamp)
  349. self.assertEqual(type(timestamp_instance - timedelta_instance), Timestamp)
  350. if not _np_version_under1p7:
  351. # Timestamp +/- datetime64 not supported, so not tested (could possibly assert error raised?)
  352. timedelta64_instance = np.timedelta64(1, 'D')
  353. self.assertEqual(type(timestamp_instance + timedelta64_instance), Timestamp)
  354. self.assertEqual(type(timestamp_instance - timedelta64_instance), Timestamp)
  355. def test_addition_subtraction_preserve_frequency(self):
  356. timestamp_instance = date_range('2014-03-05', periods=1, freq='D')[0]
  357. timedelta_instance = datetime.timedelta(days=1)
  358. original_freq = timestamp_instance.freq
  359. self.assertEqual((timestamp_instance + 1).freq, original_freq)
  360. self.assertEqual((timestamp_instance - 1).freq, original_freq)
  361. self.assertEqual((timestamp_instance + timedelta_instance).freq, original_freq)
  362. self.assertEqual((timestamp_instance - timedelta_instance).freq, original_freq)
  363. if not _np_version_under1p7:
  364. timedelta64_instance = np.timedelta64(1, 'D')
  365. self.assertEqual((timestamp_instance + timedelta64_instance).freq, original_freq)
  366. self.assertEqual((timestamp_instance - timedelta64_instance).freq, original_freq)
  367. if __name__ == '__main__':
  368. nose.runmodule(argv=[__file__, '-vvs', '-x', '--pdb', '--pdb-failure'],
  369. exit=False)