Skip to content

Commit cc6ac5c

Browse files
jbrockmendelPingviinituutti
authored andcommitted
implement independent parts of pandas-dev#24024 (pandas-dev#24276)
* implement independent parts of pandas-dev#24024 * move monotonic checks up
1 parent aa3303a commit cc6ac5c

File tree

15 files changed

+136
-72
lines changed

15 files changed

+136
-72
lines changed

pandas/core/arrays/datetimelike.py

+21-5
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55

66
import numpy as np
77

8-
from pandas._libs import NaT, iNaT, lib
8+
from pandas._libs import NaT, algos, iNaT, lib
99
from pandas._libs.tslibs.period import (
1010
DIFFERENT_FREQ_INDEX, IncompatibleFrequency, Period)
1111
from pandas._libs.tslibs.timedeltas import Timedelta, delta_to_nanoseconds
@@ -155,6 +155,7 @@ class TimelikeOps(object):
155155
times
156156
157157
.. versionadded:: 0.24.0
158+
158159
nonexistent : 'shift', 'NaT', default 'raise'
159160
A nonexistent time does not exist in a particular timezone
160161
where clocks moved forward due to DST.
@@ -246,7 +247,7 @@ def _round(self, freq, mode, ambiguous, nonexistent):
246247
if 'tz' in attribs:
247248
attribs['tz'] = None
248249
return self._ensure_localized(
249-
self._shallow_copy(result, **attribs), ambiguous, nonexistent
250+
self._simple_new(result, **attribs), ambiguous, nonexistent
250251
)
251252

252253
@Appender((_round_doc + _round_example).format(op="round"))
@@ -310,6 +311,8 @@ def shape(self):
310311

311312
@property
312313
def size(self):
314+
# type: () -> int
315+
"""The number of elements in this array."""
313316
return np.prod(self.shape)
314317

315318
def __len__(self):
@@ -554,6 +557,21 @@ def _validate_frequency(cls, index, freq, **kwargs):
554557
'does not conform to passed frequency {passed}'
555558
.format(infer=inferred, passed=freq.freqstr))
556559

560+
# monotonicity/uniqueness properties are called via frequencies.infer_freq,
561+
# see GH#23789
562+
563+
@property
564+
def _is_monotonic_increasing(self):
565+
return algos.is_monotonic(self.asi8, timelike=True)[0]
566+
567+
@property
568+
def _is_monotonic_decreasing(self):
569+
return algos.is_monotonic(self.asi8, timelike=True)[1]
570+
571+
@property
572+
def _is_unique(self):
573+
return len(unique1d(self.asi8)) == len(self)
574+
557575
# ------------------------------------------------------------------
558576
# Arithmetic Methods
559577

@@ -661,9 +679,7 @@ def _add_nat(self):
661679
# and datetime dtypes
662680
result = np.zeros(len(self), dtype=np.int64)
663681
result.fill(iNaT)
664-
if is_timedelta64_dtype(self):
665-
return type(self)(result, freq=None)
666-
return type(self)(result, tz=self.tz, freq=None)
682+
return type(self)(result, dtype=self.dtype, freq=None)
667683

668684
def _sub_nat(self):
669685
"""

pandas/core/arrays/datetimes.py

+19-5
Original file line numberDiff line numberDiff line change
@@ -165,10 +165,23 @@ class DatetimeArrayMixin(dtl.DatetimeLikeArrayMixin,
165165
_data
166166
"""
167167
_typ = "datetimearray"
168+
169+
# define my properties & methods for delegation
168170
_bool_ops = ['is_month_start', 'is_month_end',
169171
'is_quarter_start', 'is_quarter_end', 'is_year_start',
170172
'is_year_end', 'is_leap_year']
171173
_object_ops = ['weekday_name', 'freq', 'tz']
174+
_field_ops = ['year', 'month', 'day', 'hour', 'minute', 'second',
175+
'weekofyear', 'week', 'weekday', 'dayofweek',
176+
'dayofyear', 'quarter', 'days_in_month',
177+
'daysinmonth', 'microsecond',
178+
'nanosecond']
179+
_other_ops = ['date', 'time', 'timetz']
180+
_datetimelike_ops = _field_ops + _object_ops + _bool_ops + _other_ops
181+
_datetimelike_methods = ['to_period', 'tz_localize',
182+
'tz_convert',
183+
'normalize', 'strftime', 'round', 'floor',
184+
'ceil', 'month_name', 'day_name']
172185

173186
# dummy attribute so that datetime.__eq__(DatetimeArray) defers
174187
# by returning NotImplemented
@@ -527,7 +540,7 @@ def _add_offset(self, offset):
527540
"or DatetimeIndex", PerformanceWarning)
528541
result = self.astype('O') + offset
529542

530-
return type(self)(result, freq='infer')
543+
return type(self)._from_sequence(result, freq='infer')
531544

532545
def _sub_datetimelike_scalar(self, other):
533546
# subtract a datetime from myself, yielding a ndarray[timedelta64[ns]]
@@ -562,8 +575,8 @@ def _add_delta(self, delta):
562575
-------
563576
result : DatetimeArray
564577
"""
565-
new_values = dtl.DatetimeLikeArrayMixin._add_delta(self, delta)
566-
return type(self)(new_values, tz=self.tz, freq='infer')
578+
new_values = super(DatetimeArrayMixin, self)._add_delta(delta)
579+
return type(self)._from_sequence(new_values, tz=self.tz, freq='infer')
567580

568581
# -----------------------------------------------------------------
569582
# Timezone Conversion and Localization Methods
@@ -866,14 +879,15 @@ def normalize(self):
866879
dtype='datetime64[ns, Asia/Calcutta]', freq=None)
867880
"""
868881
if self.tz is None or timezones.is_utc(self.tz):
869-
not_null = self.notna()
882+
not_null = ~self.isna()
870883
DAY_NS = ccalendar.DAY_SECONDS * 1000000000
871884
new_values = self.asi8.copy()
872885
adjustment = (new_values[not_null] % DAY_NS)
873886
new_values[not_null] = new_values[not_null] - adjustment
874887
else:
875888
new_values = conversion.normalize_i8_timestamps(self.asi8, self.tz)
876-
return type(self)(new_values, freq='infer').tz_localize(self.tz)
889+
return type(self)._from_sequence(new_values,
890+
freq='infer').tz_localize(self.tz)
877891

878892
def to_period(self, freq=None):
879893
"""

pandas/core/arrays/period.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -336,7 +336,7 @@ def to_timestamp(self, freq=None, how='start'):
336336
new_data = self.asfreq(freq, how=how)
337337

338338
new_data = libperiod.periodarr_to_dt64arr(new_data.asi8, base)
339-
return DatetimeArrayMixin(new_data, freq='infer')
339+
return DatetimeArrayMixin._from_sequence(new_data, freq='infer')
340340

341341
# --------------------------------------------------------------------
342342
# Array-like / EA-Interface Methods

pandas/core/arrays/timedeltas.py

+17-22
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@
66

77
import numpy as np
88

9-
from pandas._libs import algos, lib, tslibs
9+
from pandas._libs import lib, tslibs
1010
from pandas._libs.tslibs import NaT, Timedelta, Timestamp, iNaT
1111
from pandas._libs.tslibs.fields import get_timedelta_field
1212
from pandas._libs.tslibs.timedeltas import (
@@ -15,15 +15,16 @@
1515
from pandas.util._decorators import Appender
1616

1717
from pandas.core.dtypes.common import (
18-
_TD_DTYPE, ensure_int64, is_datetime64_dtype, is_float_dtype,
18+
_NS_DTYPE, _TD_DTYPE, ensure_int64, is_datetime64_dtype, is_float_dtype,
1919
is_integer_dtype, is_list_like, is_object_dtype, is_scalar,
2020
is_string_dtype, is_timedelta64_dtype)
21+
from pandas.core.dtypes.dtypes import DatetimeTZDtype
2122
from pandas.core.dtypes.generic import (
2223
ABCDataFrame, ABCIndexClass, ABCSeries, ABCTimedeltaIndex)
2324
from pandas.core.dtypes.missing import isna
2425

2526
from pandas.core import ops
26-
from pandas.core.algorithms import checked_add_with_arr, unique1d
27+
from pandas.core.algorithms import checked_add_with_arr
2728
import pandas.core.common as com
2829

2930
from pandas.tseries.frequencies import to_offset
@@ -90,7 +91,7 @@ def wrapper(self, other):
9091

9192
else:
9293
try:
93-
other = type(self)(other)._data
94+
other = type(self)._from_sequence(other)._data
9495
except (ValueError, TypeError):
9596
return ops.invalid_comparison(self, other, op)
9697

@@ -112,6 +113,14 @@ def wrapper(self, other):
112113
class TimedeltaArrayMixin(dtl.DatetimeLikeArrayMixin, dtl.TimelikeOps):
113114
_typ = "timedeltaarray"
114115
__array_priority__ = 1000
116+
# define my properties & methods for delegation
117+
_other_ops = []
118+
_bool_ops = []
119+
_object_ops = ['freq']
120+
_field_ops = ['days', 'seconds', 'microseconds', 'nanoseconds']
121+
_datetimelike_ops = _field_ops + _object_ops + _bool_ops
122+
_datetimelike_methods = ["to_pytimedelta", "total_seconds",
123+
"round", "floor", "ceil"]
115124

116125
# Needed so that NaT.__richcmp__(DateTimeArray) operates pointwise
117126
ndim = 1
@@ -222,21 +231,6 @@ def _validate_fill_value(self, fill_value):
222231
"Got '{got}'.".format(got=fill_value))
223232
return fill_value
224233

225-
# monotonicity/uniqueness properties are called via frequencies.infer_freq,
226-
# see GH#23789
227-
228-
@property
229-
def _is_monotonic_increasing(self):
230-
return algos.is_monotonic(self.asi8, timelike=True)[0]
231-
232-
@property
233-
def _is_monotonic_decreasing(self):
234-
return algos.is_monotonic(self.asi8, timelike=True)[1]
235-
236-
@property
237-
def _is_unique(self):
238-
return len(unique1d(self.asi8)) == len(self)
239-
240234
# ----------------------------------------------------------------
241235
# Arithmetic Methods
242236

@@ -262,8 +256,8 @@ def _add_delta(self, delta):
262256
-------
263257
result : TimedeltaArray
264258
"""
265-
new_values = dtl.DatetimeLikeArrayMixin._add_delta(self, delta)
266-
return type(self)(new_values, freq='infer')
259+
new_values = super(TimedeltaArrayMixin, self)._add_delta(delta)
260+
return type(self)._from_sequence(new_values, freq='infer')
267261

268262
def _add_datetime_arraylike(self, other):
269263
"""
@@ -293,7 +287,8 @@ def _add_datetimelike_scalar(self, other):
293287
result = checked_add_with_arr(i8, other.value,
294288
arr_mask=self._isnan)
295289
result = self._maybe_mask_results(result)
296-
return DatetimeArrayMixin(result, tz=other.tz, freq=self.freq)
290+
dtype = DatetimeTZDtype(tz=other.tz) if other.tz else _NS_DTYPE
291+
return DatetimeArrayMixin(result, dtype=dtype, freq=self.freq)
297292

298293
def _addsub_offset_array(self, other, op):
299294
# Add or subtract Array-like of DateOffset objects

pandas/core/indexes/datetimes.py

+7-18
Original file line numberDiff line numberDiff line change
@@ -191,32 +191,21 @@ def _join_i8_wrapper(joinf, **kwargs):
191191
_tz = None
192192
_freq = None
193193
_comparables = ['name', 'freqstr', 'tz']
194-
_attributes = ['name', 'freq', 'tz']
194+
_attributes = ['name', 'tz', 'freq']
195195

196196
# dummy attribute so that datetime.__eq__(DatetimeArray) defers
197197
# by returning NotImplemented
198198
timetuple = None
199199

200-
# define my properties & methods for delegation
201-
_bool_ops = ['is_month_start', 'is_month_end',
202-
'is_quarter_start', 'is_quarter_end', 'is_year_start',
203-
'is_year_end', 'is_leap_year']
204-
_object_ops = ['weekday_name', 'freq', 'tz']
205-
_field_ops = ['year', 'month', 'day', 'hour', 'minute', 'second',
206-
'weekofyear', 'week', 'weekday', 'dayofweek',
207-
'dayofyear', 'quarter', 'days_in_month',
208-
'daysinmonth', 'microsecond',
209-
'nanosecond']
210-
_other_ops = ['date', 'time', 'timetz']
211-
_datetimelike_ops = _field_ops + _object_ops + _bool_ops + _other_ops
212-
_datetimelike_methods = ['to_period', 'tz_localize',
213-
'tz_convert',
214-
'normalize', 'strftime', 'round', 'floor',
215-
'ceil', 'month_name', 'day_name']
216-
217200
_is_numeric_dtype = False
218201
_infer_as_myclass = True
219202

203+
# some things like freq inference make use of these attributes.
204+
_bool_ops = DatetimeArray._bool_ops
205+
_object_ops = DatetimeArray._object_ops
206+
_field_ops = DatetimeArray._field_ops
207+
_datetimelike_ops = DatetimeArray._datetimelike_ops
208+
220209
# --------------------------------------------------------------------
221210
# Constructors
222211

pandas/io/formats/format.py

+2-2
Original file line numberDiff line numberDiff line change
@@ -873,6 +873,8 @@ def format_array(values, formatter, float_format=None, na_rep='NaN',
873873

874874
if is_datetime64_dtype(values.dtype):
875875
fmt_klass = Datetime64Formatter
876+
elif is_datetime64tz_dtype(values):
877+
fmt_klass = Datetime64TZFormatter
876878
elif is_timedelta64_dtype(values.dtype):
877879
fmt_klass = Timedelta64Formatter
878880
elif is_extension_array_dtype(values.dtype):
@@ -881,8 +883,6 @@ def format_array(values, formatter, float_format=None, na_rep='NaN',
881883
fmt_klass = FloatArrayFormatter
882884
elif is_integer_dtype(values.dtype):
883885
fmt_klass = IntArrayFormatter
884-
elif is_datetime64tz_dtype(values):
885-
fmt_klass = Datetime64TZFormatter
886886
else:
887887
fmt_klass = GenericArrayFormatter
888888

pandas/tests/indexes/datetimes/test_astype.py

+11
Original file line numberDiff line numberDiff line change
@@ -299,3 +299,14 @@ def test_to_period_nofreq(self):
299299
idx = DatetimeIndex(['2000-01-01', '2000-01-02', '2000-01-03'])
300300
assert idx.freqstr is None
301301
tm.assert_index_equal(idx.to_period(), expected)
302+
303+
@pytest.mark.parametrize('tz', [None, 'US/Central'])
304+
def test_astype_array_fallback(self, tz):
305+
obj = pd.date_range("2000", periods=2, tz=tz)
306+
result = obj.astype(bool)
307+
expected = pd.Index(np.array([True, True]))
308+
tm.assert_index_equal(result, expected)
309+
310+
result = obj._data.astype(bool)
311+
expected = np.array([True, True])
312+
tm.assert_numpy_array_equal(result, expected)

pandas/tests/indexes/period/test_astype.py

+21
Original file line numberDiff line numberDiff line change
@@ -97,3 +97,24 @@ def test_astype_object2(self):
9797
for i in [0, 1, 3]:
9898
assert result_list[i] == expected_list[i]
9999
assert result_list[2] is pd.NaT
100+
101+
def test_astype_category(self):
102+
obj = pd.period_range("2000", periods=2)
103+
result = obj.astype('category')
104+
expected = pd.CategoricalIndex([pd.Period('2000-01-01', freq="D"),
105+
pd.Period('2000-01-02', freq="D")])
106+
tm.assert_index_equal(result, expected)
107+
108+
result = obj._data.astype('category')
109+
expected = expected.values
110+
tm.assert_categorical_equal(result, expected)
111+
112+
def test_astype_array_fallback(self):
113+
obj = pd.period_range("2000", periods=2)
114+
result = obj.astype(bool)
115+
expected = pd.Index(np.array([True, True]))
116+
tm.assert_index_equal(result, expected)
117+
118+
result = obj._data.astype(bool)
119+
expected = np.array([True, True])
120+
tm.assert_numpy_array_equal(result, expected)

pandas/tests/indexes/timedeltas/test_astype.py

+11
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,7 @@
44
import pytest
55

66
import pandas.util.testing as tm
7+
import pandas as pd
78
from pandas import (
89
Float64Index, Index, Int64Index, NaT, Timedelta, TimedeltaIndex,
910
timedelta_range
@@ -77,3 +78,13 @@ def test_astype_raises(self, dtype):
7778
msg = 'Cannot cast TimedeltaIndex to dtype'
7879
with pytest.raises(TypeError, match=msg):
7980
idx.astype(dtype)
81+
82+
def test_astype_array_fallback(self):
83+
obj = pd.timedelta_range("1H", periods=2)
84+
result = obj.astype(bool)
85+
expected = pd.Index(np.array([True, True]))
86+
tm.assert_index_equal(result, expected)
87+
88+
result = obj._data.astype(bool)
89+
expected = np.array([True, True])
90+
tm.assert_numpy_array_equal(result, expected)

pandas/tests/io/json/test_pandas.py

+2-1
Original file line numberDiff line numberDiff line change
@@ -1026,7 +1026,8 @@ def test_tz_range_is_utc(self):
10261026
dti = pd.DatetimeIndex(tz_range)
10271027
assert dumps(dti, iso_dates=True) == exp
10281028
df = DataFrame({'DT': dti})
1029-
assert dumps(df, iso_dates=True) == dfexp
1029+
result = dumps(df, iso_dates=True)
1030+
assert result == dfexp
10301031

10311032
tz_range = pd.date_range('2013-01-01 00:00:00', periods=2,
10321033
tz='US/Eastern')

pandas/tests/series/test_datetime_values.py

+10
Original file line numberDiff line numberDiff line change
@@ -555,3 +555,13 @@ def test_setitem_with_string_index(self):
555555
x['Date'] = date.today()
556556
assert x.Date == date.today()
557557
assert x['Date'] == date.today()
558+
559+
def test_setitem_with_different_tz(self):
560+
# GH#24024
561+
ser = pd.Series(pd.date_range('2000', periods=2, tz="US/Central"))
562+
ser[0] = pd.Timestamp("2000", tz='US/Eastern')
563+
expected = pd.Series([
564+
pd.Timestamp("2000-01-01 00:00:00-05:00", tz="US/Eastern"),
565+
pd.Timestamp("2000-01-02 00:00:00-06:00", tz="US/Central"),
566+
], dtype=object)
567+
tm.assert_series_equal(ser, expected)

pandas/tests/series/test_timeseries.py

+10
Original file line numberDiff line numberDiff line change
@@ -1023,3 +1023,13 @@ def test_get_level_values_box(self):
10231023
index = MultiIndex(levels=levels, codes=codes)
10241024

10251025
assert isinstance(index.get_level_values(0)[0], Timestamp)
1026+
1027+
def test_view_tz(self):
1028+
# GH#24024
1029+
ser = pd.Series(pd.date_range('2000', periods=4, tz='US/Central'))
1030+
result = ser.view("i8")
1031+
expected = pd.Series([946706400000000000,
1032+
946792800000000000,
1033+
946879200000000000,
1034+
946965600000000000])
1035+
tm.assert_series_equal(result, expected)

0 commit comments

Comments
 (0)