From 1c26375c0743a2cbdcfe14a62ad10806001cbee8 Mon Sep 17 00:00:00 2001 From: Tom Augspurger Date: Wed, 24 Oct 2018 13:50:01 -0500 Subject: [PATCH 01/23] CI: Pin CPython to 3.6.6 (#23322) --- ci/azure-windows-36.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ci/azure-windows-36.yaml b/ci/azure-windows-36.yaml index 656a6a31d92b4..d03a6cbbd662c 100644 --- a/ci/azure-windows-36.yaml +++ b/ci/azure-windows-36.yaml @@ -16,7 +16,7 @@ dependencies: - pyarrow - pytables - python-dateutil - - python=3.6.* + - python=3.6.6 - pytz - scipy - thrift=0.10* From c584ae7856cf9d6c8838b4e1c3cd2fa0bebfee98 Mon Sep 17 00:00:00 2001 From: Tom Augspurger Date: Thu, 25 Oct 2018 06:06:31 -0500 Subject: [PATCH 02/23] TST: Update sparse data generation (#23323) There's a spurious failure on master when the first is randomly chosen to be 0, since type(arr.fill_value) doesn't match arr.dtype.type --- pandas/tests/extension/test_sparse.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pandas/tests/extension/test_sparse.py b/pandas/tests/extension/test_sparse.py index ca0435141c2e2..6946da6fdc36d 100644 --- a/pandas/tests/extension/test_sparse.py +++ b/pandas/tests/extension/test_sparse.py @@ -12,7 +12,7 @@ def make_data(fill_value): if np.isnan(fill_value): data = np.random.uniform(size=100) else: - data = np.random.randint(0, 100, size=100) + data = np.random.randint(1, 100, size=100) data[2::3] = fill_value return data From a20b09759f833cfd71e059319a41b9bd25a96751 Mon Sep 17 00:00:00 2001 From: Justin Zheng Date: Thu, 25 Oct 2018 04:26:13 -0700 Subject: [PATCH 03/23] BUG-23224 Fix PR 23237 / Integer NA creation from None (#23310) --- pandas/core/arrays/integer.py | 2 +- pandas/tests/arrays/test_integer.py | 3 ++- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/pandas/core/arrays/integer.py b/pandas/core/arrays/integer.py index 17e92c3976e2c..9e045a7785660 100644 --- a/pandas/core/arrays/integer.py +++ b/pandas/core/arrays/integer.py @@ -173,7 +173,7 @@ def coerce_to_array(values, dtype, mask=None, copy=False): values = np.array(values, copy=copy) if is_object_dtype(values): inferred_type = lib.infer_dtype(values) - if inferred_type is 'mixed' and isna(values).any(): + if inferred_type is 'mixed' and isna(values).all(): values = np.empty(len(values)) values.fill(np.nan) elif inferred_type not in ['floating', 'integer', diff --git a/pandas/tests/arrays/test_integer.py b/pandas/tests/arrays/test_integer.py index e6dae0ffaec28..10961173d4b6b 100644 --- a/pandas/tests/arrays/test_integer.py +++ b/pandas/tests/arrays/test_integer.py @@ -560,7 +560,8 @@ def test_integer_array_constructor_copy(): 1.0, pd.date_range('20130101', periods=2), np.array(['foo']), - [[1, 2], [3, 4]]]) + [[1, 2], [3, 4]], + [np.nan, {'a': 1}]]) def test_to_integer_array_error(values): # error in converting existing arrays to IntegerArrays with pytest.raises(TypeError): From 6b8e5e871dc4544db0e9a24463b1e64d1164147e Mon Sep 17 00:00:00 2001 From: Roman Imankulov Date: Thu, 25 Oct 2018 12:33:41 +0100 Subject: [PATCH 04/23] BUG: Let MultiIndex.set_levels accept any iterable (#23273) (#23291) --- doc/source/whatsnew/v0.24.0.txt | 1 + pandas/core/indexes/multi.py | 3 +++ pandas/tests/indexes/multi/test_get_set.py | 14 ++++++++++++++ 3 files changed, 18 insertions(+) diff --git a/doc/source/whatsnew/v0.24.0.txt b/doc/source/whatsnew/v0.24.0.txt index 4f17133ef4a8c..c85a6fd2270af 100644 --- a/doc/source/whatsnew/v0.24.0.txt +++ b/doc/source/whatsnew/v0.24.0.txt @@ -1091,6 +1091,7 @@ Indexing - Bug in 
:meth:`DataFrame.loc` when indexing with an :class:`IntervalIndex` (:issue:`19977`) - :class:`Index` no longer mangles ``None``, ``NaN`` and ``NaT``, i.e. they are treated as three different keys. However, for numeric Index all three are still coerced to a ``NaN`` (:issue:`22332`) - Bug in `scalar in Index` if scalar is a float while the ``Index`` is of integer dtype (:issue:`22085`) +- Bug in `MultiIndex.set_levels` when levels value is not subscriptable (:issue:`23273`) Missing ^^^^^^^ diff --git a/pandas/core/indexes/multi.py b/pandas/core/indexes/multi.py index 3cccb65503378..79ac32d2f6a0b 100644 --- a/pandas/core/indexes/multi.py +++ b/pandas/core/indexes/multi.py @@ -389,6 +389,9 @@ def set_levels(self, levels, level=None, inplace=False, labels=[[0, 0, 1, 1], [0, 1, 0, 1]], names=[u'foo', u'bar']) """ + if is_list_like(levels) and not isinstance(levels, Index): + levels = list(levels) + if level is not None and not is_list_like(level): if not is_list_like(levels): raise TypeError("Levels must be list-like") diff --git a/pandas/tests/indexes/multi/test_get_set.py b/pandas/tests/indexes/multi/test_get_set.py index 99ab54a83636c..ff2170839b012 100644 --- a/pandas/tests/indexes/multi/test_get_set.py +++ b/pandas/tests/indexes/multi/test_get_set.py @@ -414,3 +414,17 @@ def test_set_value_keeps_names(): df.at[('grethe', '4'), 'one'] = 99.34 assert df._is_copy is None assert df.index.names == ('Name', 'Number') + + +def test_set_levels_with_iterable(): + # GH23273 + sizes = [1, 2, 3] + colors = ['black'] * 3 + index = pd.MultiIndex.from_arrays([sizes, colors], names=['size', 'color']) + + result = index.set_levels(map(int, ['3', '2', '1']), level='size') + + expected_sizes = [3, 2, 1] + expected = pd.MultiIndex.from_arrays([expected_sizes, colors], + names=['size', 'color']) + tm.assert_index_equal(result, expected) From 0a2d5019dc2b8f9521879f47a197076d9cef38ce Mon Sep 17 00:00:00 2001 From: Matthew Roeschke Date: Thu, 25 Oct 2018 04:46:29 -0700 Subject: [PATCH 05/23] API/ENH: tz_localize handling of nonexistent times: rename keyword + add shift option (#22644) --- doc/source/timeseries.rst | 32 ++++++++ doc/source/whatsnew/v0.24.0.txt | 2 + pandas/_libs/tslibs/conversion.pyx | 82 +++++++++++-------- pandas/_libs/tslibs/nattype.pyx | 20 ++++- pandas/_libs/tslibs/timestamps.pyx | 43 ++++++++-- pandas/core/arrays/datetimes.py | 49 ++++++++--- pandas/core/generic.py | 29 +++++-- .../tests/indexes/datetimes/test_timezones.py | 44 +++++++++- .../tests/scalar/timestamp/test_timezones.py | 54 +++++++++++- pandas/tests/series/test_timezones.py | 40 ++++++++- 10 files changed, 330 insertions(+), 65 deletions(-) diff --git a/doc/source/timeseries.rst b/doc/source/timeseries.rst index 85b0abe421eb2..a52c80106f100 100644 --- a/doc/source/timeseries.rst +++ b/doc/source/timeseries.rst @@ -2357,6 +2357,38 @@ constructor as well as ``tz_localize``. # tz_convert(None) is identical with tz_convert('UTC').tz_localize(None) didx.tz_convert('UCT').tz_localize(None) +.. _timeseries.timezone_nonexistent: + +Nonexistent Times when Localizing +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +A DST transition may also shift the local time ahead by 1 hour creating nonexistent +local times. The behavior of localizing a timeseries with nonexistent times +can be controlled by the ``nonexistent`` argument. 
The following options are available:
+
+* ``raise``: Raises a ``pytz.NonExistentTimeError`` (the default behavior)
+* ``NaT``: Replaces nonexistent times with ``NaT``
+* ``shift``: Shifts nonexistent times forward to the closest real time
+
+.. ipython:: python
+
+   dti = date_range(start='2015-03-29 01:30:00', periods=3, freq='H')
+   # 2:30 is a nonexistent time
+
+Localization of nonexistent times will raise an error by default.
+
+.. code-block:: ipython
+
+   In [2]: dti.tz_localize('Europe/Warsaw')
+   NonExistentTimeError: 2015-03-29 02:30:00
+
+Transform nonexistent times to ``NaT`` or the closest real time forward in time.
+
+.. ipython:: python
+
+   dti
+   dti.tz_localize('Europe/Warsaw', nonexistent='shift')
+   dti.tz_localize('Europe/Warsaw', nonexistent='NaT')
+
+
 .. _timeseries.timezone_series:
 
 TZ Aware Dtypes
diff --git a/doc/source/whatsnew/v0.24.0.txt b/doc/source/whatsnew/v0.24.0.txt
index c85a6fd2270af..e4b31b21b11ac 100644
--- a/doc/source/whatsnew/v0.24.0.txt
+++ b/doc/source/whatsnew/v0.24.0.txt
@@ -205,6 +205,7 @@ Other Enhancements
 - New attribute :attr:`__git_version__` will return git commit sha of current build (:issue:`21295`).
 - Compatibility with Matplotlib 3.0 (:issue:`22790`).
 - Added :meth:`Interval.overlaps`, :meth:`IntervalArray.overlaps`, and :meth:`IntervalIndex.overlaps` for determining overlaps between interval-like objects (:issue:`21998`)
+- :meth:`Timestamp.tz_localize`, :meth:`DatetimeIndex.tz_localize`, and :meth:`Series.tz_localize` have gained the ``nonexistent`` argument for alternative handling of nonexistent times. See :ref:`timeseries.timezone_nonexistent` (:issue:`8917`)
 
 .. _whatsnew_0240.api_breaking:
 
@@ -912,6 +913,7 @@ Deprecations
 - :meth:`FrozenNDArray.searchsorted` has deprecated the ``v`` parameter in favor of ``value`` (:issue:`14645`)
 - :func:`DatetimeIndex.shift` and :func:`PeriodIndex.shift` now accept ``periods`` argument instead of ``n`` for consistency with :func:`Index.shift` and :func:`Series.shift`. Using ``n`` throws a deprecation warning (:issue:`22458`, :issue:`22912`)
 - The ``fastpath`` keyword of the different Index constructors is deprecated (:issue:`23110`).
+- :meth:`Timestamp.tz_localize`, :meth:`DatetimeIndex.tz_localize`, and :meth:`Series.tz_localize` have deprecated the ``errors`` argument in favor of the ``nonexistent`` argument (:issue:`8917`)
 
 ..
_whatsnew_0240.prior_deprecations: diff --git a/pandas/_libs/tslibs/conversion.pyx b/pandas/_libs/tslibs/conversion.pyx index d7eef546befbd..f9c604cd76472 100644 --- a/pandas/_libs/tslibs/conversion.pyx +++ b/pandas/_libs/tslibs/conversion.pyx @@ -1,5 +1,4 @@ # -*- coding: utf-8 -*- - import cython from cython import Py_ssize_t @@ -44,6 +43,7 @@ from nattype cimport NPY_NAT, checknull_with_nat # Constants cdef int64_t DAY_NS = 86400000000000LL +cdef int64_t HOURS_NS = 3600000000000 NS_DTYPE = np.dtype('M8[ns]') TD_DTYPE = np.dtype('m8[ns]') @@ -458,8 +458,7 @@ cdef _TSObject convert_str_to_tsobject(object ts, object tz, object unit, if tz is not None: # shift for localize_tso ts = tz_localize_to_utc(np.array([ts], dtype='i8'), tz, - ambiguous='raise', - errors='raise')[0] + ambiguous='raise')[0] except OutOfBoundsDatetime: # GH#19382 for just-barely-OutOfBounds falling back to dateutil @@ -826,7 +825,7 @@ def tz_convert(int64_t[:] vals, object tz1, object tz2): @cython.boundscheck(False) @cython.wraparound(False) def tz_localize_to_utc(ndarray[int64_t] vals, object tz, object ambiguous=None, - object errors='raise'): + object nonexistent=None): """ Localize tzinfo-naive i8 to given time zone (using pytz). If there are ambiguities in the values, raise AmbiguousTimeError. @@ -837,7 +836,10 @@ def tz_localize_to_utc(ndarray[int64_t] vals, object tz, object ambiguous=None, tz : tzinfo or None ambiguous : str, bool, or arraylike If arraylike, must have the same length as vals - errors : {"raise", "coerce"}, default "raise" + nonexistent : str + If arraylike, must have the same length as vals + + .. versionadded:: 0.24.0 Returns ------- @@ -849,16 +851,13 @@ def tz_localize_to_utc(ndarray[int64_t] vals, object tz, object ambiguous=None, ndarray ambiguous_array Py_ssize_t i, idx, pos, ntrans, n = len(vals) int64_t *tdata - int64_t v, left, right + int64_t v, left, right, val, v_left, v_right ndarray[int64_t] result, result_a, result_b, dst_hours npy_datetimestruct dts bint infer_dst = False, is_dst = False, fill = False - bint is_coerce = errors == 'coerce', is_raise = errors == 'raise' + bint shift = False, fill_nonexist = False # Vectorized version of DstTzInfo.localize - - assert is_coerce or is_raise - if tz == UTC or tz is None: return vals @@ -888,39 +887,45 @@ def tz_localize_to_utc(ndarray[int64_t] vals, object tz, object ambiguous=None, "the same size as vals") ambiguous_array = np.asarray(ambiguous) + if nonexistent == 'NaT': + fill_nonexist = True + elif nonexistent == 'shift': + shift = True + else: + assert nonexistent in ('raise', None), ("nonexistent must be one of" + " {'NaT', 'raise', 'shift'}") + trans, deltas, typ = get_dst_info(tz) tdata = cnp.PyArray_DATA(trans) ntrans = len(trans) + # Determine whether each date lies left of the DST transition (store in + # result_a) or right of the DST transition (store in result_b) result_a = np.empty(n, dtype=np.int64) result_b = np.empty(n, dtype=np.int64) result_a.fill(NPY_NAT) result_b.fill(NPY_NAT) - # left side - idx_shifted = (np.maximum(0, trans.searchsorted( + idx_shifted_left = (np.maximum(0, trans.searchsorted( vals - DAY_NS, side='right') - 1)).astype(np.int64) - for i in range(n): - v = vals[i] - deltas[idx_shifted[i]] - pos = bisect_right_i8(tdata, v, ntrans) - 1 - - # timestamp falls to the left side of the DST transition - if v + deltas[pos] == vals[i]: - result_a[i] = v - - # right side - idx_shifted = (np.maximum(0, trans.searchsorted( + idx_shifted_right = (np.maximum(0, trans.searchsorted( vals + DAY_NS, side='right') - 
1)).astype(np.int64)
 
     for i in range(n):
-        v = vals[i] - deltas[idx_shifted[i]]
-        pos = bisect_right_i8(tdata, v, ntrans) - 1
+        val = vals[i]
+        v_left = val - deltas[idx_shifted_left[i]]
+        pos_left = bisect_right_i8(tdata, v_left, ntrans) - 1
+        # timestamp falls to the left side of the DST transition
+        if v_left + deltas[pos_left] == val:
+            result_a[i] = v_left
 
+        v_right = val - deltas[idx_shifted_right[i]]
+        pos_right = bisect_right_i8(tdata, v_right, ntrans) - 1
         # timestamp falls to the right side of the DST transition
-        if v + deltas[pos] == vals[i]:
-            result_b[i] = v
+        if v_right + deltas[pos_right] == val:
+            result_b[i] = v_right
 
     if infer_dst:
         dst_hours = np.empty(n, dtype=np.int64)
@@ -935,7 +940,7 @@ def tz_localize_to_utc(ndarray[int64_t] vals, object tz, object ambiguous=None,
             stamp = _render_tstamp(vals[trans_idx])
             raise pytz.AmbiguousTimeError(
-                "Cannot infer dst time from %s as there "
-                "are no repeated times" % stamp)
+                "Cannot infer dst time from {} as there "
+                "are no repeated times".format(stamp))
         # Split the array into contiguous chunks (where the difference between
         # indices is 1). These are effectively dst transitions in different
         # years which is useful for checking that there is not an ambiguous
@@ -960,7 +965,7 @@ def tz_localize_to_utc(ndarray[int64_t] vals, object tz, object ambiguous=None,
             if switch_idx.size > 1:
                 raise pytz.AmbiguousTimeError(
-                    "There are %i dst switches when "
-                    "there should only be 1." % switch_idx.size)
+                    "There are {} dst switches when "
+                    "there should only be 1.".format(switch_idx.size))
             switch_idx = switch_idx[0] + 1  # Pull the only index and adjust
             a_idx = grp[:switch_idx]
@@ -968,10 +973,11 @@ def tz_localize_to_utc(ndarray[int64_t] vals, object tz, object ambiguous=None,
             dst_hours[grp] = np.hstack((result_a[a_idx], result_b[b_idx]))
 
     for i in range(n):
+        val = vals[i]
         left = result_a[i]
         right = result_b[i]
-        if vals[i] == NPY_NAT:
-            result[i] = vals[i]
+        if val == NPY_NAT:
+            result[i] = val
         elif left != NPY_NAT and right != NPY_NAT:
             if left == right:
                 result[i] = left
@@ -986,19 +992,27 @@ def tz_localize_to_utc(ndarray[int64_t] vals, object tz, object ambiguous=None,
             elif fill:
                 result[i] = NPY_NAT
             else:
-                stamp = _render_tstamp(vals[i])
+                stamp = _render_tstamp(val)
                 raise pytz.AmbiguousTimeError(
-                    "Cannot infer dst time from %r, try using the "
-                    "'ambiguous' argument" % stamp)
+                    "Cannot infer dst time from {!r}, try using the "
+                    "'ambiguous' argument".format(stamp))
         elif left != NPY_NAT:
             result[i] = left
         elif right != NPY_NAT:
             result[i] = right
         else:
-            if is_coerce:
+            # Handle nonexistent times
+            if shift:
+                # Shift the nonexistent time forward to the closest existing
+                # time
+                remaining_minutes = val % HOURS_NS
+                new_local = val + (HOURS_NS - remaining_minutes)
+                delta_idx = trans.searchsorted(new_local, side='right') - 1
+                result[i] = new_local - deltas[delta_idx]
+            elif fill_nonexist:
                 result[i] = NPY_NAT
             else:
-                stamp = _render_tstamp(vals[i])
+                stamp = _render_tstamp(val)
                 raise pytz.NonExistentTimeError(stamp)
 
     return result
diff --git a/pandas/_libs/tslibs/nattype.pyx b/pandas/_libs/tslibs/nattype.pyx
index ae4f9c821b5d1..0eec84ecf8285 100644
--- a/pandas/_libs/tslibs/nattype.pyx
+++ b/pandas/_libs/tslibs/nattype.pyx
@@ -564,14 +564,26 @@ class NaTType(_NaT):
           - 'NaT' will return NaT for an ambiguous time
           - 'raise' will raise an AmbiguousTimeError for an ambiguous time
 
-        errors : 'raise', 'coerce', default 'raise'
+        nonexistent : 'shift', 'NaT', default 'raise'
+            A nonexistent time does not exist in a particular timezone
+            where clocks moved forward due to DST.
+ + - 'shift' will shift the nonexistent time forward to the closest + existing time + - 'NaT' will return NaT where there are nonexistent times + - 'raise' will raise an NonExistentTimeError if there are + nonexistent times + + .. versionadded:: 0.24.0 + + errors : 'raise', 'coerce', default None - 'raise' will raise a NonExistentTimeError if a timestamp is not valid in the specified timezone (e.g. due to a transition from - or to DST time) + or to DST time). Use ``nonexistent='raise'`` instead. - 'coerce' will return NaT if the timestamp can not be converted - into the specified timezone + into the specified timezone. Use ``nonexistent='NaT'`` instead. - .. versionadded:: 0.19.0 + .. deprecated:: 0.24.0 Returns ------- diff --git a/pandas/_libs/tslibs/timestamps.pyx b/pandas/_libs/tslibs/timestamps.pyx index 0c2753dbc6f28..08b0c5472549e 100644 --- a/pandas/_libs/tslibs/timestamps.pyx +++ b/pandas/_libs/tslibs/timestamps.pyx @@ -961,7 +961,8 @@ class Timestamp(_Timestamp): def is_leap_year(self): return bool(ccalendar.is_leapyear(self.year)) - def tz_localize(self, tz, ambiguous='raise', errors='raise'): + def tz_localize(self, tz, ambiguous='raise', nonexistent='raise', + errors=None): """ Convert naive Timestamp to local time zone, or remove timezone from tz-aware Timestamp. @@ -978,14 +979,26 @@ class Timestamp(_Timestamp): - 'NaT' will return NaT for an ambiguous time - 'raise' will raise an AmbiguousTimeError for an ambiguous time - errors : 'raise', 'coerce', default 'raise' + nonexistent : 'shift', 'NaT', default 'raise' + A nonexistent time does not exist in a particular timezone + where clocks moved forward due to DST. + + - 'shift' will shift the nonexistent time forward to the closest + existing time + - 'NaT' will return NaT where there are nonexistent times + - 'raise' will raise an NonExistentTimeError if there are + nonexistent times + + .. versionadded:: 0.24.0 + + errors : 'raise', 'coerce', default None - 'raise' will raise a NonExistentTimeError if a timestamp is not valid in the specified timezone (e.g. due to a transition from - or to DST time) + or to DST time). Use ``nonexistent='raise'`` instead. - 'coerce' will return NaT if the timestamp can not be converted - into the specified timezone + into the specified timezone. Use ``nonexistent='NaT'`` instead. - .. versionadded:: 0.19.0 + .. deprecated:: 0.24.0 Returns ------- @@ -999,13 +1012,31 @@ class Timestamp(_Timestamp): if ambiguous == 'infer': raise ValueError('Cannot infer offset with only one time.') + if errors is not None: + warnings.warn("The errors argument is deprecated and will be " + "removed in a future release. 
Use " + "nonexistent='NaT' or nonexistent='raise' " + "instead.", FutureWarning) + if errors == 'coerce': + nonexistent = 'NaT' + elif errors == 'raise': + nonexistent = 'raise' + else: + raise ValueError("The errors argument must be either 'coerce' " + "or 'raise'.") + + if nonexistent not in ('raise', 'NaT', 'shift'): + raise ValueError("The nonexistent argument must be one of 'raise'," + " 'NaT' or 'shift'") + if self.tzinfo is None: # tz naive, localize tz = maybe_get_tz(tz) if not is_string_object(ambiguous): ambiguous = [ambiguous] value = tz_localize_to_utc(np.array([self.value], dtype='i8'), tz, - ambiguous=ambiguous, errors=errors)[0] + ambiguous=ambiguous, + nonexistent=nonexistent)[0] return Timestamp(value, tz=tz) else: if tz is None: diff --git a/pandas/core/arrays/datetimes.py b/pandas/core/arrays/datetimes.py index ac90483513af5..b6574c121c087 100644 --- a/pandas/core/arrays/datetimes.py +++ b/pandas/core/arrays/datetimes.py @@ -611,7 +611,8 @@ def tz_convert(self, tz): # No conversion since timestamps are all UTC to begin with return self._shallow_copy(tz=tz) - def tz_localize(self, tz, ambiguous='raise', errors='raise'): + def tz_localize(self, tz, ambiguous='raise', nonexistent='raise', + errors=None): """ Localize tz-naive Datetime Array/Index to tz-aware Datetime Array/Index. @@ -627,8 +628,7 @@ def tz_localize(self, tz, ambiguous='raise', errors='raise'): tz : string, pytz.timezone, dateutil.tz.tzfile or None Time zone to convert timestamps to. Passing ``None`` will remove the time zone information preserving local time. - ambiguous : str {'infer', 'NaT', 'raise'} or bool array, - default 'raise' + ambiguous : 'infer', 'NaT', bool array, default 'raise' - 'infer' will attempt to infer fall dst-transition hours based on order @@ -639,15 +639,27 @@ def tz_localize(self, tz, ambiguous='raise', errors='raise'): - 'raise' will raise an AmbiguousTimeError if there are ambiguous times - errors : {'raise', 'coerce'}, default 'raise' + nonexistent : 'shift', 'NaT' default 'raise' + A nonexistent time does not exist in a particular timezone + where clocks moved forward due to DST. + + - 'shift' will shift the nonexistent times forward to the closest + existing time + - 'NaT' will return NaT where there are nonexistent times + - 'raise' will raise an NonExistentTimeError if there are + nonexistent times + + .. versionadded:: 0.24.0 + + errors : {'raise', 'coerce'}, default None - 'raise' will raise a NonExistentTimeError if a timestamp is not valid in the specified time zone (e.g. due to a transition from - or to DST time) + or to DST time). Use ``nonexistent='raise'`` instead. - 'coerce' will return NaT if the timestamp can not be converted - to the specified time zone + to the specified time zone. Use ``nonexistent='NaT'`` instead. - .. versionadded:: 0.19.0 + .. deprecated:: 0.24.0 Returns ------- @@ -689,6 +701,23 @@ def tz_localize(self, tz, ambiguous='raise', errors='raise'): '2018-03-03 09:00:00'], dtype='datetime64[ns]', freq='D') """ + if errors is not None: + warnings.warn("The errors argument is deprecated and will be " + "removed in a future release. 
Use " + "nonexistent='NaT' or nonexistent='raise' " + "instead.", FutureWarning) + if errors == 'coerce': + nonexistent = 'NaT' + elif errors == 'raise': + nonexistent = 'raise' + else: + raise ValueError("The errors argument must be either 'coerce' " + "or 'raise'.") + + if nonexistent not in ('raise', 'NaT', 'shift'): + raise ValueError("The nonexistent argument must be one of 'raise'," + " 'NaT' or 'shift'") + if self.tz is not None: if tz is None: new_dates = conversion.tz_convert(self.asi8, 'UTC', self.tz) @@ -698,9 +727,9 @@ def tz_localize(self, tz, ambiguous='raise', errors='raise'): tz = timezones.maybe_get_tz(tz) # Convert to UTC - new_dates = conversion.tz_localize_to_utc(self.asi8, tz, - ambiguous=ambiguous, - errors=errors) + new_dates = conversion.tz_localize_to_utc( + self.asi8, tz, ambiguous=ambiguous, nonexistent=nonexistent, + ) new_dates = new_dates.view(_NS_DTYPE) return self._shallow_copy(new_dates, tz=tz) diff --git a/pandas/core/generic.py b/pandas/core/generic.py index 31b700abcfdb3..c24872d7c89e9 100644 --- a/pandas/core/generic.py +++ b/pandas/core/generic.py @@ -8627,7 +8627,7 @@ def _tz_convert(ax, tz): return result.__finalize__(self) def tz_localize(self, tz, axis=0, level=None, copy=True, - ambiguous='raise'): + ambiguous='raise', nonexistent='raise'): """ Localize tz-naive TimeSeries to target time zone. @@ -8649,6 +8649,17 @@ def tz_localize(self, tz, axis=0, level=None, copy=True, - 'NaT' will return NaT where there are ambiguous times - 'raise' will raise an AmbiguousTimeError if there are ambiguous times + nonexistent : 'shift', 'NaT', default 'raise' + A nonexistent time does not exist in a particular timezone + where clocks moved forward due to DST. + + - 'shift' will shift the nonexistent times forward to the closest + existing time + - 'NaT' will return NaT where there are nonexistent times + - 'raise' will raise an NonExistentTimeError if there are + nonexistent times + + .. versionadded:: 0.24.0 Returns ------- @@ -8658,10 +8669,14 @@ def tz_localize(self, tz, axis=0, level=None, copy=True, TypeError If the TimeSeries is tz-aware and tz is not None. 
""" + if nonexistent not in ('raise', 'NaT', 'shift'): + raise ValueError("The nonexistent argument must be one of 'raise'," + " 'NaT' or 'shift'") + axis = self._get_axis_number(axis) ax = self._get_axis(axis) - def _tz_localize(ax, tz, ambiguous): + def _tz_localize(ax, tz, ambiguous, nonexistent): if not hasattr(ax, 'tz_localize'): if len(ax) > 0: ax_name = self._get_axis_name(axis) @@ -8670,19 +8685,23 @@ def _tz_localize(ax, tz, ambiguous): else: ax = DatetimeIndex([], tz=tz) else: - ax = ax.tz_localize(tz, ambiguous=ambiguous) + ax = ax.tz_localize( + tz, ambiguous=ambiguous, nonexistent=nonexistent + ) return ax # if a level is given it must be a MultiIndex level or # equivalent to the axis name if isinstance(ax, MultiIndex): level = ax._get_level_number(level) - new_level = _tz_localize(ax.levels[level], tz, ambiguous) + new_level = _tz_localize( + ax.levels[level], tz, ambiguous, nonexistent + ) ax = ax.set_levels(new_level, level=level) else: if level not in (None, 0, ax.name): raise ValueError("The level {0} is not valid".format(level)) - ax = _tz_localize(ax, tz, ambiguous) + ax = _tz_localize(ax, tz, ambiguous, nonexistent) result = self._constructor(self._data, copy=copy) result.set_axis(ax, axis=axis, inplace=True) diff --git a/pandas/tests/indexes/datetimes/test_timezones.py b/pandas/tests/indexes/datetimes/test_timezones.py index dc01f7ccbd496..1369783657f92 100644 --- a/pandas/tests/indexes/datetimes/test_timezones.py +++ b/pandas/tests/indexes/datetimes/test_timezones.py @@ -312,9 +312,13 @@ def test_dti_tz_localize_nonexistent_raise_coerce(self): index.tz_localize(tz=tz) with pytest.raises(pytz.NonExistentTimeError): - index.tz_localize(tz=tz, errors='raise') + with tm.assert_produces_warning(FutureWarning): + index.tz_localize(tz=tz, errors='raise') - result = index.tz_localize(tz=tz, errors='coerce') + with tm.assert_produces_warning(FutureWarning, + clear=FutureWarning, + check_stacklevel=False): + result = index.tz_localize(tz=tz, errors='coerce') test_times = ['2015-03-08 01:00-05:00', 'NaT', '2015-03-08 03:00-04:00'] dti = to_datetime(test_times, utc=True) @@ -574,6 +578,42 @@ def test_dti_tz_localize_bdate_range(self): localized = dr.tz_localize(pytz.utc) tm.assert_index_equal(dr_utc, localized) + @pytest.mark.parametrize('tz', ['Europe/Warsaw', 'dateutil/Europe/Warsaw']) + @pytest.mark.parametrize('method, exp', [ + ['shift', '2015-03-29 03:00:00'], + ['NaT', pd.NaT], + ['raise', None], + ['foo', 'invalid'] + ]) + def test_dti_tz_localize_nonexistent(self, tz, method, exp): + # GH 8917 + n = 60 + dti = date_range(start='2015-03-29 02:00:00', periods=n, freq='min') + if method == 'raise': + with pytest.raises(pytz.NonExistentTimeError): + dti.tz_localize(tz, nonexistent=method) + elif exp == 'invalid': + with pytest.raises(ValueError): + dti.tz_localize(tz, nonexistent=method) + else: + result = dti.tz_localize(tz, nonexistent=method) + expected = DatetimeIndex([exp] * n, tz=tz) + tm.assert_index_equal(result, expected) + + @pytest.mark.filterwarnings('ignore::FutureWarning') + def test_dti_tz_localize_errors_deprecation(self): + # GH 22644 + tz = 'Europe/Warsaw' + n = 60 + dti = date_range(start='2015-03-29 02:00:00', periods=n, freq='min') + with tm.assert_produces_warning(FutureWarning, check_stacklevel=False): + with pytest.raises(ValueError): + dti.tz_localize(tz, errors='foo') + # make sure errors='coerce' gets mapped correctly to nonexistent + result = dti.tz_localize(tz, errors='coerce') + expected = dti.tz_localize(tz, nonexistent='NaT') + 
tm.assert_index_equal(result, expected) + # ------------------------------------------------------------- # DatetimeIndex.normalize diff --git a/pandas/tests/scalar/timestamp/test_timezones.py b/pandas/tests/scalar/timestamp/test_timezones.py index 8cebfafeae82a..827ad3581cd49 100644 --- a/pandas/tests/scalar/timestamp/test_timezones.py +++ b/pandas/tests/scalar/timestamp/test_timezones.py @@ -79,20 +79,44 @@ def test_tz_localize_ambiguous(self): ('2015-03-08 02:30', 'US/Pacific'), ('2015-03-29 02:00', 'Europe/Paris'), ('2015-03-29 02:30', 'Europe/Belgrade')]) + @pytest.mark.filterwarnings('ignore::FutureWarning') def test_tz_localize_nonexistent(self, stamp, tz): # GH#13057 ts = Timestamp(stamp) with pytest.raises(NonExistentTimeError): ts.tz_localize(tz) + # GH 22644 with pytest.raises(NonExistentTimeError): - ts.tz_localize(tz, errors='raise') - assert ts.tz_localize(tz, errors='coerce') is NaT + with tm.assert_produces_warning(FutureWarning): + ts.tz_localize(tz, errors='raise') + with tm.assert_produces_warning(FutureWarning): + assert ts.tz_localize(tz, errors='coerce') is NaT def test_tz_localize_errors_ambiguous(self): # GH#13057 ts = Timestamp('2015-11-1 01:00') with pytest.raises(AmbiguousTimeError): - ts.tz_localize('US/Pacific', errors='coerce') + with tm.assert_produces_warning(FutureWarning): + ts.tz_localize('US/Pacific', errors='coerce') + + @pytest.mark.filterwarnings('ignore::FutureWarning') + def test_tz_localize_errors_invalid_arg(self): + # GH 22644 + tz = 'Europe/Warsaw' + ts = Timestamp('2015-03-29 02:00:00') + with pytest.raises(ValueError): + with tm.assert_produces_warning(FutureWarning): + ts.tz_localize(tz, errors='foo') + + def test_tz_localize_errors_coerce(self): + # GH 22644 + # make sure errors='coerce' gets mapped correctly to nonexistent + tz = 'Europe/Warsaw' + ts = Timestamp('2015-03-29 02:00:00') + with tm.assert_produces_warning(FutureWarning): + result = ts.tz_localize(tz, errors='coerce') + expected = ts.tz_localize(tz, nonexistent='NaT') + assert result is expected @pytest.mark.parametrize('stamp', ['2014-02-01 09:00', '2014-07-08 09:00', '2014-11-01 17:00', '2014-11-05 00:00']) @@ -158,6 +182,30 @@ def test_timestamp_tz_localize(self, tz): assert result.hour == expected.hour assert result == expected + @pytest.mark.parametrize('tz', ['Europe/Warsaw', 'dateutil/Europe/Warsaw']) + def test_timestamp_tz_localize_nonexistent_shift(self, tz): + # GH 8917 + ts = Timestamp('2015-03-29 02:20:00') + result = ts.tz_localize(tz, nonexistent='shift') + expected = Timestamp('2015-03-29 03:00:00').tz_localize(tz) + assert result == expected + + @pytest.mark.parametrize('tz', ['Europe/Warsaw', 'dateutil/Europe/Warsaw']) + def test_timestamp_tz_localize_nonexistent_NaT(self, tz): + # GH 8917 + ts = Timestamp('2015-03-29 02:20:00') + result = ts.tz_localize(tz, nonexistent='NaT') + assert result is NaT + + @pytest.mark.parametrize('tz', ['Europe/Warsaw', 'dateutil/Europe/Warsaw']) + def test_timestamp_tz_localize_nonexistent_raise(self, tz): + # GH 8917 + ts = Timestamp('2015-03-29 02:20:00') + with pytest.raises(pytz.NonExistentTimeError): + ts.tz_localize(tz, nonexistent='raise') + with pytest.raises(ValueError): + ts.tz_localize(tz, nonexistent='foo') + # ------------------------------------------------------------------ # Timestamp.tz_convert diff --git a/pandas/tests/series/test_timezones.py b/pandas/tests/series/test_timezones.py index 472b2c5644fa5..8c1ea6bff5f4d 100644 --- a/pandas/tests/series/test_timezones.py +++ b/pandas/tests/series/test_timezones.py 
@@ -13,7 +13,7 @@ from pandas._libs.tslibs import timezones, conversion from pandas.compat import lrange from pandas.core.indexes.datetimes import date_range -from pandas import Series, Timestamp, DatetimeIndex, Index +from pandas import Series, Timestamp, DatetimeIndex, Index, NaT class TestSeriesTimezones(object): @@ -33,6 +33,21 @@ def test_series_tz_localize(self): tm.assert_raises_regex(TypeError, 'Already tz-aware', ts.tz_localize, 'US/Eastern') + @pytest.mark.filterwarnings('ignore::FutureWarning') + def test_tz_localize_errors_deprecation(self): + # GH 22644 + tz = 'Europe/Warsaw' + n = 60 + rng = date_range(start='2015-03-29 02:00:00', periods=n, freq='min') + ts = Series(rng) + with tm.assert_produces_warning(FutureWarning, check_stacklevel=False): + with pytest.raises(ValueError): + ts.dt.tz_localize(tz, errors='foo') + # make sure errors='coerce' gets mapped correctly to nonexistent + result = ts.dt.tz_localize(tz, errors='coerce') + expected = ts.dt.tz_localize(tz, nonexistent='NaT') + tm.assert_series_equal(result, expected) + def test_series_tz_localize_ambiguous_bool(self): # make sure that we are correctly accepting bool values as ambiguous @@ -60,6 +75,29 @@ def test_series_tz_localize_ambiguous_bool(self): result = ser.dt.tz_localize('US/Central', ambiguous=[False]) tm.assert_series_equal(result, expected1) + @pytest.mark.parametrize('tz', ['Europe/Warsaw', 'dateutil/Europe/Warsaw']) + @pytest.mark.parametrize('method, exp', [ + ['shift', '2015-03-29 03:00:00'], + ['NaT', NaT], + ['raise', None], + ['foo', 'invalid'] + ]) + def test_series_tz_localize_nonexistent(self, tz, method, exp): + # GH 8917 + n = 60 + dti = date_range(start='2015-03-29 02:00:00', periods=n, freq='min') + s = Series(1, dti) + if method == 'raise': + with pytest.raises(pytz.NonExistentTimeError): + s.tz_localize(tz, nonexistent=method) + elif exp == 'invalid': + with pytest.raises(ValueError): + dti.tz_localize(tz, nonexistent=method) + else: + result = s.tz_localize(tz, nonexistent=method) + expected = Series(1, index=DatetimeIndex([exp] * n, tz=tz)) + tm.assert_series_equal(result, expected) + @pytest.mark.parametrize('tzstr', ['US/Eastern', 'dateutil/US/Eastern']) def test_series_tz_localize_empty(self, tzstr): # GH#2248 From c76173b5ff34a407a88f4b1e68b784c4bd410eb3 Mon Sep 17 00:00:00 2001 From: Krishna Date: Thu, 25 Oct 2018 17:54:23 +0100 Subject: [PATCH 06/23] DOC: Added Examples for Series max (#23298) --- pandas/core/generic.py | 45 +++++++++++++++++++++++++++++++++++++++--- 1 file changed, 42 insertions(+), 3 deletions(-) diff --git a/pandas/core/generic.py b/pandas/core/generic.py index c24872d7c89e9..ceed4c3083471 100644 --- a/pandas/core/generic.py +++ b/pandas/core/generic.py @@ -9381,7 +9381,7 @@ def compound(self, axis=None, skipna=None, level=None): """This method returns the maximum of the values in the object. If you want the *index* of the maximum, use ``idxmax``. This is the equivalent of the ``numpy.ndarray`` method ``argmax``.""", - nanops.nanmax) + nanops.nanmax, _max_examples) cls.min = _make_stat_function( cls, 'min', name, name2, axis_descr, """This method returns the minimum of the values in the object. @@ -10229,6 +10229,44 @@ def _doc_parms(cls): nan """ +_max_examples = """\ +Examples +-------- +``MultiIndex`` series example of monthly rainfall + +>>> index = pd.MultiIndex.from_product( +... [['London', 'New York'], ['Jun', 'Jul', 'Aug']], +... 
names=['city', 'month'])
+>>> s = pd.Series([47, 35, 54, 112, 117, 113], index=index)
+>>> s
+city      month
+London    Jun       47
+          Jul       35
+          Aug       54
+New York  Jun      112
+          Jul      117
+          Aug      113
+dtype: int64
+
+>>> s.max()
+117
+
+Max using level names, as well as indices
+
+>>> s.max(level='city')
+city
+London       54
+New York    117
+dtype: int64
+
+>>> s.max(level=1)
+month
+Jun    112
+Jul    117
+Aug    113
+dtype: int64
+"""
+
 _min_count_stub = """\
 min_count : int, default 0
@@ -10266,9 +10304,10 @@ def stat_func(self, axis=None, skipna=None, level=None, numeric_only=None,
     return set_function_name(stat_func, name, cls)
 
-def _make_stat_function(cls, name, name1, name2, axis_descr, desc, f):
+def _make_stat_function(cls, name, name1, name2, axis_descr, desc, f,
+                        examples=''):
     @Substitution(outname=name, desc=desc, name1=name1, name2=name2,
-                  axis_descr=axis_descr, min_count='', examples='')
+                  axis_descr=axis_descr, min_count='', examples=examples)
     @Appender(_num_doc)
     def stat_func(self, axis=None, skipna=None, level=None, numeric_only=None,
                   **kwargs):

From ed294301318fae52ab7993ec57aab99f4630e985 Mon Sep 17 00:00:00 2001
From: Tom Augspurger
Date: Thu, 25 Oct 2018 17:38:54 -0500
Subject: [PATCH 07/23] REF: Make PeriodArray an ExtensionArray (#22862)

* WIP: PeriodArray
* WIP
* remove debug
* Just moves
* PeriodArray.shift definition
* _data type
* clean
* accessor wip
* some more wip
* tshift, shift
* Arithmetic
* repr changes
* wip
* freq setter
* Added disabled ops
* copy
* Support concat
* object ctor
* Updates
* lint
* lint
* wip
* more wip
* array-setitem
* wip
* wip
* Use ._tshift internally for datetimelike ops

  In preparation for PeriodArray / DatetimeArray / TimedeltaArray.

  Index.shift has a different meaning from ExtensionArray.shift:

  - Index.shift pointwise shifts each element by some amount
  - ExtensionArray.shift shifts the *position* of each value in the array,
    padding the end with NA

  This is going to get confusing. This PR tries to avoid some of that by
  internally using a new `_tshift` method (time-shift) when we want to do
  pointwise shifting of each value. Places that know they want that
  behavior (like in the datetimelike ops) should use that.

* deep
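A minimal sketch of the two shift semantics described above (illustrative only,
not code from this diff; it assumes the ``period_array`` helper this patch adds
to ``pandas.core.arrays``, and the reprs are abbreviated):

    import pandas as pd
    from pandas.core.arrays import period_array

    pi = pd.period_range('2018-01', periods=3, freq='M')

    # Index.shift: a pointwise time-shift; every element moves ahead one month
    pi.shift(1)   # PeriodIndex(['2018-02', '2018-03', '2018-04'], freq='M')

    # ExtensionArray.shift: a positional shift of the values; the vacated
    # slot is filled with the dtype's NA value (NaT for periods)
    arr = period_array(['2018-01', '2018-02', '2018-03'], freq='M')
    arr.shift(1)  # <PeriodArray> [NaT, '2018-01', '2018-02']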

* Squashed commit of the following:

  commit bccfc3f8d821d739892ea0bc6eca88e9ffb04434: Merge remote-tracking branch 'upstream/master' into period-dtype-type
  commit 9caf04836ad34ca17da7b86ba7120cca58ce142a: CI: change windows vm image (#22948)
  commit d65980ec629558bfc205316ce6be01daecb54a9d: typo
  commit e5c61fcab619dde608add7a2b33bb51d100ebfaf: Merge remote-tracking branch 'upstream/master' into period-dtype-type
  commit d7a8e1b8686024b3c891d01ce267ccbfd1beabb9: Fixed
  commit 598cc622d957ecba6cbb76c72ef3aeea98f55526: doc note
  commit 83db05c7ddec7a87ff77430ab686873b8a329a0f: updates
  commit 1d9f76c5055d1ef31ce76134e88b5568a119f498: CLN: remove Index._to_embed (#22879)
  commit 6247da0db4835ff723126640145b4fad3ce17343: Provide default implementation for `data_repated` (#22935)
  commit f07ab807e5eb393121197307de5718db429b71a8: str, bytes
  commit 8a8bdb05008ed52fe0eb8d4168347bc2af116b4a: import at top
  commit 99bafdd5513c7091e88416c725690605d9e808f4: Update type for PeriodDtype; removed unused IntervalDtypeType
  commit 5ce06b5bdb8c44043c6463bf8ce3da758800a189: BUG: to_datetime preserves name of Index argument in the result (#22918)

* fixup
* The rest of the EA tests
* docs
* rename to time_shift
* Squashed commit of the following:

  commit 11a0d938cdaf7482546691519577b5dd28f69aac: typerror
  commit a0cd5e79eb06ac71cf2f510b1a2122bc2b21fcf0: TypeError for Series
  commit 2247461ec0b1017db320cb8581337cba0b5c6679: Test op(Series[EA], EA])
  commit c9fe5d318d7077f99413532cdaf392ae3ea9cd2c: make strict
  commit 7ef697cffdcd2f8d701de3cdfd2e6897358effbf: Use super
  commit 35d42133acbcb3c25308b1c10e0e2dc3fa1052b6: Merge remote-tracking branch 'upstream/master' into ea-divmod
  commit ee808033bd5c546e7439a06d2ed37b57c9e66844: BUG: Correctly weekly resample over DST (#22941)
  commit fea27f0736a4b8f6626da60a6abc2f6e26b8a365: CI: pin moto to 1.3.4 (#22959)
  commit 15d32bbad832908c9d06a9019e613bb6b35d6878: [CLN] Dispatch (some) Frame ops to Series, avoiding _data.eval (#22019)
  commit 3e3256bb6038111812b4b28f6b3b049214d83d2d: Allow passing a mask to NanOps (#22865)
  commit e756e991d57c2656906d0a3e8fc76950844e3f3e: CLN: Use is_period_dtype instead of ABCPeriodIndex checks (#22958)
  commit 03181f0569c8b1f93f620a2986b4f174f9b6179b: BUG: fix Series(extension array) + extension array values addition (#22479)
  commit 04ea51ddf7623b897aaaf2e504952d3c11e88205: CLN: small clean-up of IntervalIndex (#22956)
  commit b0f9a104f323d687a56ea878ff78ff005f37b42d: DOC GH22893 Fix docstring of groupby in pandas/core/generic.py (#22920)
  commit 08ecba8dab4a35ad3cad89fe02c7240674938b97: BUG: fix DataFrame+DataFrame op with timedelta64 dtype (#22696)
  commit c44bad24996f9e747f2119fa0c6a90d893f6e2aa: CLN GH22873 Replace base excepts in pandas/core (#22901)
  commit 8e749a33b5f814bded42044a4182449d5d6c8213: CLN GH22874 replace bare excepts in pandas/io/pytables.py (#22919)
  commit 1102a33d9776ed316cade079e22be6daa76c9e42: DOC/CLN: clean-up shared_docs in generic.py (#20074)
  commit 0671e7d67df8b0aa258fd864ef5f3169fe0ffc55: Fixup
  commit 1b4261f41c70379fa868866bc77e7a31c43baa5d: Merge remote-tracking branch 'upstream/master' into ea-divmod
  commit c92a4a899b8d5e5e6a0479f390a604dc9f624f89: Update old test
  commit 52538fa03a8c9722ab5c86c88419105b6ebfe5a1: BUG: divmod return type

* Squashed commit of the following:

  commit 7714e79a512f5d13f52c286458fcc9bac8b40bd0: Always return ndarray
  commit 1921c6f5d00e0a9a5da2ce8e628b2c6328ee215e: Merge remote-tracking branch 'upstream/master' into combine-exception
  commit 01f73669666f577fe141f5066646c4253408d3b8: Merge remote-tracking branch 'upstream/master' into combine-exception
  commit 5372134ea2d22c90fff4b5830464a8f2c9932407: fixed move
  commit ce1a3c6b112a6228847f9c622ef8246c671f7170: fixed move
  commit b9c7e4b2c0577fed6601e4f6e27974b943f280da: remove old note
  commit a4a2933117c493394a5656c887a22ea02e94093f: handle test
  commit be63feb818b1e39d0f711d55c1eac809a03ee061: move test
  commit 0eef0cfcdb17caed9cdddce03cb5d07924225375: move back
  commit 2183f7bf71a90661877c87fe04dcd52efa481184: api
  commit 85fc5d83a4754fb46e900d51491f92024a3ff4b8: Merge remote-tracking branch 'upstream/master' into combine-exception
  commit 9059c0d23357a717f5f7ba8f5e165000b70efcc2: Note
  commit 0c53f080b419151286b6991acff540150f13fccc: Imports
  commit ce94bf9b9c6799bd4220976022895edd4e60abd5: Moves
  commit fdd43c4de98992a6f97a835fdbb525f829ef1d69: Closes https://github.com/pandas-dev/pandas/issues/22850

* fixed merge conflict
* Handle divmod test
* extension tests passing
* Squashed commit of the following:

  commit c9d6e89a1f401e4f47b384b72030873cc4cc2f2b: xpass -> skip
  commit 95d5cbfe4eaf53ed60e84a938723062a14d2d625: typo, import
  commit 4e9b7f0a6ceec0275e22f5f1edac1daeb41f5033: doc update
  commit cc2bfc8b991f4d8cf46a993bf4205cc80656384e: Merge remote-tracking branch 'upstream/master' into ea-divmod
  commit fe67b94e7681c1f21fc2be212514ca0d67a6603c: Update type for PeriodDtype / DatetimeTZDtype / IntervalDtype (#22938)
  commit b12e5ba55c3691733dab36373e80d1b16134c8c2: Safer is dtype (#22975)
  commit c19c8052f384206c3b2cd87f277344d21d0ae2c7: Catch Exception in combine (#22936)
  commit d553ab3e5650d105de8e02ae6fd57d03af57b214: TST: Fixturize series/test_combine_concat.py (#22964)
  commit 4c78b9738e01ae147106301cca76c6b36ee68d06: TST: Fixturize series/test_constructors.py (#22965)
  commit 45d3bb761dd44edd0853b06fd81f05af915fd695: TST: Fixturize series/test_datetime_values.py (#22966)
  commit f1a22ff56f895ed340ed7db6dc46841b81d331a1: TST: Fixturize series/test_dtypes.py (#22967)
  commit abf68fd1d5694403e506416c68f6abec6d780c39: TST: Fixturize series/test_io.py (#22972)
  commit e6b0c2915f6433d7c29af908f91a6d511177eec1: TST: Fixturize series/test_missing.py (#22973)
  commit 9b405b829bf5e3fd142cccbcca46df4cc3df4ccb: CLN: values is required argument in _shallow_copy_with_infer (#22983)
  commit c282e310809921a0dadd4446f23c9273c15da443: Fix ASV import error (#22978)

* merge conflict
* wip
* indexes passing
* op names
* extension, arrays passing
* fixup
* lint
* Fixed to_timestamp
* Same error message for index, series
* Fix freq handling in to_timestamp
* dtype update
* accept kwargs
* fixups
* updates
* explicit
* add to assert
* wip period_array
* wip period_array
* order
* sort order
* test for hashing
* update
* lint
* boxing
* fix fixtures
* infer
* Remove seemingly unreachable code
* lint
* wip
* Updates for master
* simplify
* wip
* remove view
* simplify
* lint
* Removed add_comparison_methods
* xfail op
* remove some
* constructors
* Constructor cleanup
* misc fixups
* more xfails
* typo
* Added asi8
* Allow setting nan
* revert breaking docs
* Override _add_sub_int_array
* lint
* Update PeriodIndex._simple_new
* Clean up uses of .values, ._values, ._ndarray_values, ._data
* one more values
* remove xfails
* Fixed freq handling in _shallow_copy with a freq
* test updates
* API: Keep PeriodIndex.values an ndarray
* BUG: Raise for non-equal freq in take
* Punt on DataFrame.replace specializing
* lint
* fixed xfail message
* TST: _from_datetime64
* Fixups: perf in period_array, pyarrow error, py2 compat
* escape
* dtype
* revert and unxfail values
* error catching
* isort
* Avoid PeriodArray.values
* clarify _box_func usage
* TST: unxfail ops tests
* Avoid use of .values
* __setitem__ type
* Misc cleanups
* docstring on PeriodArray
* examples for period_array
* remove _box_values_as_index
* names
* object_dtype
* use __sub__
* lint
* API: remove ordinal from period_array
* catch exception
* misc cleanup
* Handle astype integer size
* Bump test coverage
* remove partial test
* close bracket
* change the test
* isort
* consistent _data
* lint
* ndarray_values -> asi8
* colocate ops
* refactor PeriodIndex.item; remove unused method
* return NotImplemented for Series / Index
* remove xpass
* release note
* types, use data
* remove ufunc xpass
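As a brief, hedged sketch of the user-visible effect (illustrative only,
mirroring the whatsnew examples further below; exact reprs depend on the
build):

    import pandas as pd

    # Period data now round-trips through Series without decaying to an
    # object-dtype ndarray
    pser = pd.Series(pd.period_range("2000", freq="D", periods=5))
    pser.dtype    # period[D]
    pser.values   # a PeriodArray (an ExtensionArray), not a NumPy array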
 pandas/tests/indexes/period/test_formats.py | 54 +-
 pandas/tests/indexes/period/test_indexing.py | 4 +-
 pandas/tests/indexes/period/test_ops.py | 22 +-
 pandas/tests/indexes/period/test_tools.py | 6 +
 pandas/tests/io/formats/test_format.py | 30 +-
 pandas/tests/io/test_feather.py | 3 +-
 pandas/tests/io/test_parquet.py | 8 +-
 pandas/tests/reshape/merge/test_merge.py | 4 +-
 pandas/tests/reshape/test_concat.py | 8 +-
 pandas/tests/scalar/test_nat.py | 5 +-
 pandas/tests/series/test_api.py | 5 +-
 pandas/tests/series/test_apply.py | 8 +-
 pandas/tests/series/test_constructors.py | 29 +-
 pandas/tests/series/test_datetime_values.py | 3 +-
 pandas/tests/series/test_operators.py | 7 +-
 pandas/tests/series/test_period.py | 30 +-
 pandas/tests/test_base.py | 17 +-
 pandas/util/testing.py | 18 +-
 51 files changed, 1779 insertions(+), 577 deletions(-)
 create mode 100644 pandas/tests/arrays/test_period.py
 create mode 100644 pandas/tests/extension/test_period.py

diff --git a/doc/source/whatsnew/v0.24.0.txt b/doc/source/whatsnew/v0.24.0.txt
index e4b31b21b11ac..47fef83d3015d 100644
--- a/doc/source/whatsnew/v0.24.0.txt
+++ b/doc/source/whatsnew/v0.24.0.txt
@@ -145,11 +145,11 @@ Current Behavior:
 
 .. _whatsnew_0240.enhancements.interval:
 
-Storing Interval Data in Series and DataFrame
-^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+Storing Interval and Period Data in Series and DataFrame
+^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
 
-Interval data may now be stored in a ``Series`` or ``DataFrame``, in addition to an
-:class:`IntervalIndex` like previously (:issue:`19453`).
+Interval and Period data may now be stored in a ``Series`` or ``DataFrame``, in addition to an
+:class:`IntervalIndex` and :class:`PeriodIndex` like previously (:issue:`19453`, :issue:`22862`).
 
 .. ipython:: python
 
@@ -157,21 +157,29 @@ Interval data may now be stored in a ``Series`` or ``DataFrame``, in addition to
     ser
     ser.dtype
 
-Previously, these would be cast to a NumPy array of ``Interval`` objects. In general,
-this should result in better performance when storing an array of intervals in
-a :class:`Series`.
+And for periods:
+
+.. ipython:: python
+
+    pser = pd.Series(pd.period_range("2000", freq="D", periods=5))
+    pser
+    pser.dtype
+
+Previously, these would be cast to a NumPy array with object dtype. In general,
+this should result in better performance when storing an array of intervals or periods
+in a :class:`Series` or column of a :class:`DataFrame`.
 
-Note that the ``.values`` of a ``Series`` containing intervals is no longer a NumPy
+Note that the ``.values`` of a ``Series`` containing one of these types is no longer a NumPy
 array, but rather an ``ExtensionArray``:
 
 .. ipython:: python
 
     ser.values
+    pser.values
 
 This is the same behavior as ``Series.values`` for categorical data. See
 :ref:`whatsnew_0240.api_breaking.interval_values` for more.
 
-
 .. _whatsnew_0240.enhancements.other:
 
 Other Enhancements
@@ -360,7 +368,7 @@ New Behavior:
 
 This mirrors ``CategoricalIndex.values``, which returns a ``Categorical``.
 
 For situations where you need an ``ndarray`` of ``Interval`` objects, use
-:meth:`numpy.asarray` or ``idx.astype(object)``.
+:meth:`numpy.asarray`.
 
 ..
ipython:: python @@ -810,6 +818,7 @@ update the ``ExtensionDtype._metadata`` tuple to match the signature of your - Updated the ``.type`` attribute for ``PeriodDtype``, ``DatetimeTZDtype``, and ``IntervalDtype`` to be instances of the dtype (``Period``, ``Timestamp``, and ``Interval`` respectively) (:issue:`22938`) - :func:`ExtensionArray.isna` is allowed to return an ``ExtensionArray`` (:issue:`22325`). - Support for reduction operations such as ``sum``, ``mean`` via opt-in base class method override (:issue:`22762`) +- :meth:`Series.unstack` no longer converts extension arrays to object-dtype ndarrays. The output ``DataFrame`` will now have the same dtype as the input. This changes behavior for Categorical and Sparse data (:issue:`23077`). .. _whatsnew_0240.api.incompatibilities: diff --git a/pandas/core/arrays/__init__.py b/pandas/core/arrays/__init__.py index 0537b79541641..ea8837332633a 100644 --- a/pandas/core/arrays/__init__.py +++ b/pandas/core/arrays/__init__.py @@ -4,7 +4,7 @@ from .categorical import Categorical # noqa from .datetimes import DatetimeArrayMixin # noqa from .interval import IntervalArray # noqa -from .period import PeriodArrayMixin # noqa +from .period import PeriodArray, period_array # noqa from .timedeltas import TimedeltaArrayMixin # noqa from .integer import ( # noqa IntegerArray, integer_array) diff --git a/pandas/core/arrays/categorical.py b/pandas/core/arrays/categorical.py index 1bc0d18bead83..4363f3ccb14e2 100644 --- a/pandas/core/arrays/categorical.py +++ b/pandas/core/arrays/categorical.py @@ -29,6 +29,7 @@ is_categorical_dtype, is_float_dtype, is_integer_dtype, + is_object_dtype, is_list_like, is_sequence, is_scalar, is_iterator, is_dict_like) @@ -342,7 +343,6 @@ def __init__(self, values, categories=None, ordered=None, dtype=None, # a.) use categories, ordered # b.) use values.dtype # c.) infer from values - if dtype is not None: # The dtype argument takes precedence over values.dtype (if any) if isinstance(dtype, compat.string_types): @@ -2478,11 +2478,26 @@ def _get_codes_for_values(values, categories): utility routine to turn values into codes given the specified categories """ from pandas.core.algorithms import _get_data_algo, _hashtables - if is_dtype_equal(values.dtype, categories.dtype): + dtype_equal = is_dtype_equal(values.dtype, categories.dtype) + + if dtype_equal: # To prevent erroneous dtype coercion in _get_data_algo, retrieve # the underlying numpy array. gh-22702 - values = getattr(values, 'values', values) - categories = getattr(categories, 'values', categories) + values = getattr(values, '_ndarray_values', values) + categories = getattr(categories, '_ndarray_values', categories) + elif (is_extension_array_dtype(categories.dtype) and + is_object_dtype(values)): + # Support inferring the correct extension dtype from an array of + # scalar objects. e.g. 
+ # Categorical(array[Period, Period], categories=PeriodIndex(...)) + try: + values = ( + categories.dtype.construct_array_type()._from_sequence(values) + ) + except Exception: + # but that may fail for any reason, so fall back to object + values = ensure_object(values) + categories = ensure_object(categories) else: values = ensure_object(values) categories = ensure_object(categories) diff --git a/pandas/core/arrays/datetimelike.py b/pandas/core/arrays/datetimelike.py index 72bc5c2209d04..943c8a94e1e6a 100644 --- a/pandas/core/arrays/datetimelike.py +++ b/pandas/core/arrays/datetimelike.py @@ -474,17 +474,8 @@ def _addsub_int_array(self, other, op): result : same class as self """ assert op in [operator.add, operator.sub] - if is_period_dtype(self): - # easy case for PeriodIndex - if op is operator.sub: - other = -other - res_values = checked_add_with_arr(self.asi8, other, - arr_mask=self._isnan) - res_values = res_values.view('i8') - res_values[self._isnan] = iNaT - return self._from_ordinals(res_values, freq=self.freq) - - elif self.freq is None: + + if self.freq is None: # GH#19123 raise NullFrequencyError("Cannot shift with no freq") @@ -524,10 +515,9 @@ def _addsub_offset_array(self, other, op): left = lib.values_from_object(self.astype('O')) res_values = op(left, np.array(other)) - kwargs = {} if not is_period_dtype(self): - kwargs['freq'] = 'infer' - return type(self)(res_values, **kwargs) + return type(self)(res_values, freq='infer') + return self._from_sequence(res_values) @deprecate_kwarg(old_arg_name='n', new_arg_name='periods') def shift(self, periods, freq=None): diff --git a/pandas/core/arrays/datetimes.py b/pandas/core/arrays/datetimes.py index b6574c121c087..e269f2e02ddfd 100644 --- a/pandas/core/arrays/datetimes.py +++ b/pandas/core/arrays/datetimes.py @@ -832,7 +832,7 @@ def to_period(self, freq=None): pandas.PeriodIndex: Immutable ndarray holding ordinal values pandas.DatetimeIndex.to_pydatetime: Return DatetimeIndex as object """ - from pandas.core.arrays import PeriodArrayMixin + from pandas.core.arrays import PeriodArray if self.tz is not None: warnings.warn("Converting to PeriodArray/Index representation " @@ -847,7 +847,7 @@ def to_period(self, freq=None): freq = get_period_alias(freq) - return PeriodArrayMixin(self.values, freq=freq) + return PeriodArray._from_datetime64(self.values, freq, tz=self.tz) def to_perioddelta(self, freq): """ diff --git a/pandas/core/arrays/period.py b/pandas/core/arrays/period.py index 1426b9690f4df..085298d8324c5 100644 --- a/pandas/core/arrays/period.py +++ b/pandas/core/arrays/period.py @@ -1,41 +1,60 @@ # -*- coding: utf-8 -*- from datetime import timedelta import operator -import warnings import numpy as np +from pandas import compat +from pandas.compat.numpy import function as nv from pandas._libs import lib from pandas._libs.tslib import NaT, iNaT from pandas._libs.tslibs.period import ( Period, IncompatibleFrequency, DIFFERENT_FREQ_INDEX, - get_period_field_arr, period_asfreq_arr) + get_period_field_arr, period_asfreq_arr, +) from pandas._libs.tslibs import period as libperiod from pandas._libs.tslibs.timedeltas import delta_to_nanoseconds, Timedelta from pandas._libs.tslibs.fields import isleapyear_arr +from pandas.util._decorators import cache_readonly +from pandas.util._validators import validate_fillna_kwargs +import pandas.core.algorithms as algos +from pandas.core.dtypes.common import ( + is_integer_dtype, is_float_dtype, is_period_dtype, + pandas_dtype, + is_datetime64_dtype, + is_categorical_dtype, + 
is_timedelta64_dtype, + is_list_like, + is_array_like, + is_object_dtype, + is_string_dtype, + is_datetime_or_timedelta_dtype, + is_dtype_equal, + ensure_object, + _TD_DTYPE, +) -from pandas import compat -from pandas.util._decorators import (cache_readonly, deprecate_kwarg) -from pandas.core.dtypes.common import ( - is_integer_dtype, is_float_dtype, is_period_dtype, is_timedelta64_dtype, - is_datetime64_dtype, _TD_DTYPE) from pandas.core.dtypes.dtypes import PeriodDtype -from pandas.core.dtypes.generic import ABCSeries +from pandas.core.dtypes.generic import ( + ABCSeries, ABCIndexClass, ABCPeriodIndex +) +from pandas.core.dtypes.missing import isna +from pandas.core.missing import pad_1d, backfill_1d import pandas.core.common as com from pandas.tseries import frequencies from pandas.tseries.offsets import Tick, DateOffset +from pandas.core.arrays import ExtensionArray from pandas.core.arrays import datetimelike as dtl -from pandas.core.arrays.datetimelike import DatetimeLikeArrayMixin def _field_accessor(name, alias, docstring=None): def f(self): base, mult = frequencies.get_freq_code(self.freq) - result = get_period_field_arr(alias, self._ndarray_values, base) + result = get_period_field_arr(alias, self.asi8, base) return result f.__name__ = name @@ -51,19 +70,29 @@ def _period_array_cmp(cls, op): nat_result = True if opname == '__ne__' else False def wrapper(self, other): - op = getattr(self._ndarray_values, opname) + op = getattr(self.asi8, opname) + # We want to eventually defer to the Series or PeriodIndex (which will + # return here with an unboxed PeriodArray). But before we do that, + # we do a bit of validation on type (Period) and freq, so that our + # error messages are sensible + not_implemented = isinstance(other, (ABCSeries, ABCIndexClass)) + if not_implemented: + other = other._values + if isinstance(other, Period): if other.freq != self.freq: msg = DIFFERENT_FREQ_INDEX.format(self.freqstr, other.freqstr) raise IncompatibleFrequency(msg) result = op(other.ordinal) - elif isinstance(other, PeriodArrayMixin): + elif isinstance(other, cls): if other.freq != self.freq: msg = DIFFERENT_FREQ_INDEX.format(self.freqstr, other.freqstr) raise IncompatibleFrequency(msg) - result = op(other._ndarray_values) + if not_implemented: + return NotImplemented + result = op(other.asi8) mask = self._isnan | other._isnan if mask.any(): @@ -71,7 +100,7 @@ def wrapper(self, other): return result elif other is NaT: - result = np.empty(len(self._ndarray_values), dtype=bool) + result = np.empty(len(self.asi8), dtype=bool) result.fill(nat_result) else: other = Period(other, freq=self.freq) @@ -85,94 +114,131 @@ def wrapper(self, other): return compat.set_function_name(wrapper, opname, cls) -class PeriodArrayMixin(DatetimeLikeArrayMixin): - @property - def _box_func(self): - return lambda x: Period._from_ordinal(ordinal=x, freq=self.freq) - - @cache_readonly - def dtype(self): - return PeriodDtype.construct_from_string(self.freq) - - @property - def _ndarray_values(self): - # Ordinals - return self._data - - @property - def asi8(self): - return self._ndarray_values.view('i8') - - @property - def freq(self): - """Return the frequency object if it is set, otherwise None""" - return self._freq - - @freq.setter - def freq(self, value): - msg = ('Setting {cls}.freq has been deprecated and will be ' - 'removed in a future version; use {cls}.asfreq instead. 
' - 'The {cls}.freq setter is not guaranteed to work.') - warnings.warn(msg.format(cls=type(self).__name__), - FutureWarning, stacklevel=2) - self._freq = value +class PeriodArray(dtl.DatetimeLikeArrayMixin, ExtensionArray): + """ + Pandas ExtensionArray for storing Period data. + + Users should use :func:`period_array` to create new instances. + + Parameters + ---------- + values : Union[PeriodArray, Series[period], ndarary[int], PeriodIndex] + The data to store. These should be arrays that can be directly + converted to ordinals without inference or copy (PeriodArray, + ndarray[int64]), or a box around such an array (Series[period], + PeriodIndex). + freq : str or DateOffset + The `freq` to use for the array. Mostly applicable when `values` + is an ndarray of integers, when `freq` is required. When `values` + is a PeriodArray (or box around), it's checked that ``values.freq`` + matches `freq`. + copy : bool, default False + Whether to copy the ordinals before storing. + + Notes + ----- + There are two components to a PeriodArray + + - ordinals : integer ndarray + - freq : pd.tseries.offsets.Offset + + The values are physically stored as a 1-D ndarray of integers. These are + called "ordinals" and represent some kind of offset from a base. + + The `freq` indicates the span covered by each element of the array. + All elements in the PeriodArray have the same `freq`. + + See Also + -------- + period_array : Create a new PeriodArray + pandas.PeriodIndex : Immutable Index for period data + """ + _attributes = ["freq"] + _typ = "periodarray" # ABCPeriodArray + + # Names others delegate to us + _other_ops = [] + _bool_ops = ['is_leap_year'] + _object_ops = ['start_time', 'end_time', 'freq'] + _field_ops = ['year', 'month', 'day', 'hour', 'minute', 'second', + 'weekofyear', 'weekday', 'week', 'dayofweek', + 'dayofyear', 'quarter', 'qyear', + 'days_in_month', 'daysinmonth'] + _datetimelike_ops = _field_ops + _object_ops + _bool_ops + _datetimelike_methods = ['strftime', 'to_timestamp', 'asfreq'] # -------------------------------------------------------------------- # Constructors + def __init__(self, values, freq=None, copy=False): + if freq is not None: + freq = Period._maybe_convert_freq(freq) - _attributes = ["freq"] + if isinstance(values, ABCSeries): + values = values._values + if not isinstance(values, type(self)): + raise TypeError("Incorrect dtype") - def __new__(cls, values, freq=None, **kwargs): - if is_period_dtype(values): - # PeriodArray, PeriodIndex - if freq is not None and values.freq != freq: - raise IncompatibleFrequency(freq, values.freq) - freq = values.freq - values = values.asi8 + elif isinstance(values, ABCPeriodIndex): + values = values._values - elif is_datetime64_dtype(values): - # TODO: what if it has tz? - values = dt64arr_to_periodarr(values, freq) + if isinstance(values, type(self)): + if freq is not None and freq != values.freq: + msg = DIFFERENT_FREQ_INDEX.format(values.freq.freqstr, + freq.freqstr) + raise IncompatibleFrequency(msg) + values, freq = values._data, values.freq - return cls._simple_new(values, freq=freq, **kwargs) + values = np.array(values, dtype='int64', copy=copy) + self._data = values + if freq is None: + raise ValueError('freq is not specified and cannot be inferred') + self._dtype = PeriodDtype(freq) @classmethod def _simple_new(cls, values, freq=None, **kwargs): - """ - Values can be any type that can be coerced to Periods. 
- Ordinals in an ndarray are fastpath-ed to `_from_ordinals` - """ + # TODO(DatetimeArray): remove once all constructors are aligned. + # alias from PeriodArray.__init__ + return cls(values, freq=freq, **kwargs) - if is_period_dtype(values): - freq = dtl.validate_dtype_freq(values.dtype, freq) - values = values.asi8 + @classmethod + def _from_sequence(cls, scalars, dtype=None, copy=False): + # type: (Sequence[Optional[Period]], PeriodDtype, bool) -> PeriodArray + if dtype: + freq = dtype.freq + else: + freq = None + periods = np.asarray(scalars, dtype=object) + if copy: + periods = periods.copy() - if not is_integer_dtype(values): - values = np.array(values, copy=False) - if len(values) > 0 and is_float_dtype(values): - raise TypeError("{cls} can't take floats" - .format(cls=cls.__name__)) - return cls(values, freq=freq, **kwargs) + freq = freq or libperiod.extract_freq(periods) + ordinals = libperiod.extract_ordinals(periods, freq) + return cls(ordinals, freq=freq) - return cls._from_ordinals(values, freq=freq, **kwargs) + def _values_for_factorize(self): + return self.asi8, iNaT @classmethod - def _from_ordinals(cls, values, freq=None, **kwargs): - """ - Values should be int ordinals - `__new__` & `_simple_new` cooerce to ordinals and call this method - """ - # **kwargs are included so that the signature matches PeriodIndex, - # letting us share _simple_new + def _from_factorized(cls, values, original): + # type: (Sequence[Optional[Period]], PeriodArray) -> PeriodArray + return cls(values, freq=original.freq) - values = np.array(values, dtype='int64', copy=False) + @classmethod + def _from_datetime64(cls, data, freq, tz=None): + """Construct a PeriodArray from a datetime64 array - result = object.__new__(cls) - result._data = values - if freq is None: - raise ValueError('freq is not specified and cannot be inferred') - result._freq = Period._maybe_convert_freq(freq) - return result + Parameters + ---------- + data : ndarray[datetime64[ns], datetime64[ns, tz]] + freq : str or Tick + tz : tzinfo, optional + + Returns + ------- + PeriodArray[freq] + """ + data, freq = dt64arr_to_periodarr(data, freq, tz) + return cls(data, freq=freq) @classmethod def _generate_range(cls, start, end, periods, freq, fields): @@ -195,6 +261,39 @@ def _generate_range(cls, start, end, periods, freq, fields): return subarr, freq + @classmethod + def _concat_same_type(cls, to_concat): + freq = {x.freq for x in to_concat} + assert len(freq) == 1 + freq = list(freq)[0] + values = np.concatenate([x._data for x in to_concat]) + return cls(values, freq=freq) + + # -------------------------------------------------------------------- + # Data / Attributes + @property + def nbytes(self): + # TODO(DatetimeArray): remove + return self._data.nbytes + + @cache_readonly + def dtype(self): + return self._dtype + + @property + def _ndarray_values(self): + # Ordinals + return self._data + + @property + def asi8(self): + return self._data + + @property + def freq(self): + """Return the frequency object for this PeriodArray.""" + return self.dtype.freq + # -------------------------------------------------------------------- # Vectorized analogues of Period properties @@ -230,6 +329,183 @@ def start_time(self): def end_time(self): return self.to_timestamp(how='end') + def __repr__(self): + return '<{}>\n{}\nLength: {}, dtype: {}'.format( + self.__class__.__name__, + [str(s) for s in self], + len(self), + self.dtype + ) + + def __setitem__( + self, + key, # type: Union[int, Sequence[int], Sequence[bool]] + value # type: 
Union[NaTType, Period, Sequence[Period]] + ): + # type: (...) -> None + # n.b. the type on `value` is a bit too restrictive. + # we also accept a sequence of stuff coercible to a PeriodArray + # by period_array, which includes things like ndarray[object], + # ndarray[datetime64ns]. I think ndarray[int] / ndarray[str] won't + # work, since the freq can't be inferred. + if is_list_like(value): + if len(key) != len(value) and not com.is_bool_indexer(key): + msg = ("shape mismatch: value array of length '{}' does not " + "match indexing result of length '{}'.") + raise ValueError(msg.format(len(key), len(value))) + if len(key) == 0: + return + + value = period_array(value) + + if self.freqstr != value.freqstr: + msg = DIFFERENT_FREQ_INDEX.format(self.freqstr, value.freqstr) + raise IncompatibleFrequency(msg) + + value = value.asi8 + elif isinstance(value, Period): + + if self.freqstr != value.freqstr: + msg = DIFFERENT_FREQ_INDEX.format(self.freqstr, value.freqstr) + raise IncompatibleFrequency(msg) + + value = value.ordinal + elif isna(value): + value = iNaT + else: + msg = ("'value' should be a 'Period', 'NaT', or array of those. " + "Got '{}' instead.".format(type(value).__name__)) + raise TypeError(msg) + self._data[key] = value + + def take(self, indices, allow_fill=False, fill_value=None): + if allow_fill: + if isna(fill_value): + fill_value = iNaT + elif isinstance(fill_value, Period): + if self.freq != fill_value.freq: + msg = DIFFERENT_FREQ_INDEX.format( + self.freq.freqstr, + fill_value.freqstr + ) + raise IncompatibleFrequency(msg) + + fill_value = fill_value.ordinal + else: + msg = "'fill_value' should be a Period. Got '{}'." + raise ValueError(msg.format(fill_value)) + + new_values = algos.take(self._data, + indices, + allow_fill=allow_fill, + fill_value=fill_value) + + return type(self)(new_values, self.freq) + + def isna(self): + return self._data == iNaT + + def fillna(self, value=None, method=None, limit=None): + # TODO(#20300) + # To avoid converting to object, we re-implement here with the changes + # 1. Passing `_data` to func instead of self.astype(object) + # 2. Re-boxing output of 1. + # #20300 should let us do this kind of logic on ExtensionArray.fillna + # and we can use it. + + if isinstance(value, ABCSeries): + value = value._values + + value, method = validate_fillna_kwargs(value, method) + + mask = self.isna() + + if is_array_like(value): + if len(value) != len(self): + raise ValueError("Length of 'value' does not match. Got ({}) " + " expected {}".format(len(value), len(self))) + value = value[mask] + + if mask.any(): + if method is not None: + func = pad_1d if method == 'pad' else backfill_1d + new_values = func(self._data, limit=limit, + mask=mask) + new_values = type(self)(new_values, freq=self.freq) + else: + # fill with value + new_values = self.copy() + new_values[mask] = value + else: + new_values = self.copy() + return new_values + + def copy(self, deep=False): + return type(self)(self._data.copy(), freq=self.freq) + + def value_counts(self, dropna=False): + from pandas import Series, PeriodIndex + + if dropna: + values = self[~self.isna()]._data + else: + values = self._data + + cls = type(self) + + result = algos.value_counts(values, sort=False) + index = PeriodIndex(cls(result.index, freq=self.freq), + name=result.index.name) + return Series(result.values, index=index, name=result.name) + + def shift(self, periods=1): + """ + Shift values by desired number. + + Newly introduced missing values are filled with + ``self.dtype.na_value``. + + .. 
versionadded:: 0.24.0 + + Parameters + ---------- + periods : int, default 1 + The number of periods to shift. Negative values are allowed + for shifting backwards. + + Returns + ------- + shifted : PeriodArray + """ + # TODO(DatetimeArray): remove + # The semantics for Index.shift differ from EA.shift + # then just call super. + return ExtensionArray.shift(self, periods) + + def _time_shift(self, n, freq=None): + """ + Shift each value by `periods`. + + Note this is different from ExtensionArray.shift, which + shifts the *position* of each element, padding the end with + missing values. + + Parameters + ---------- + periods : int + Number of periods to shift by. + freq : pandas.DateOffset, pandas.Timedelta, or string + Frequency increment to shift by. + """ + values = self._data + n * self.freq.n + if self.hasnans: + values[self._isnan] = iNaT + return type(self)(values, freq=self.freq) + + @property + def _box_func(self): + return lambda x: Period._from_ordinal(ordinal=x, freq=self.freq) + def asfreq(self, freq=None, how='E'): """ Convert the Period Array/Index to the specified frequency `freq`. @@ -287,7 +563,7 @@ def asfreq(self, freq=None, how='E'): if self.hasnans: new_data[self._isnan] = iNaT - return self._shallow_copy(new_data, freq=freq) + return type(self)(new_data, freq=freq) def to_timestamp(self, freq=None, how='start'): """ @@ -327,126 +603,9 @@ def to_timestamp(self, freq=None, how='start'): base, mult = frequencies.get_freq_code(freq) new_data = self.asfreq(freq, how=how) - new_data = libperiod.periodarr_to_dt64arr(new_data._ndarray_values, - base) + new_data = libperiod.periodarr_to_dt64arr(new_data.asi8, base) return DatetimeArrayMixin(new_data, freq='infer') - # ------------------------------------------------------------------ - # Arithmetic Methods - - _create_comparison_method = classmethod(_period_array_cmp) - - def _sub_datelike(self, other): - assert other is not NaT - return NotImplemented - - def _sub_period(self, other): - # If the operation is well-defined, we return an object-Index - # of DateOffsets. Null entries are filled with pd.NaT - if self.freq != other.freq: - msg = DIFFERENT_FREQ_INDEX.format(self.freqstr, other.freqstr) - raise IncompatibleFrequency(msg) - - asi8 = self.asi8 - new_data = asi8 - other.ordinal - new_data = np.array([self.freq * x for x in new_data]) - - if self.hasnans: - new_data[self._isnan] = NaT - - return new_data - - def _add_offset(self, other): - assert not isinstance(other, Tick) - base = frequencies.get_base_alias(other.rule_code) - if base != self.freq.rule_code: - msg = DIFFERENT_FREQ_INDEX.format(self.freqstr, other.freqstr) - raise IncompatibleFrequency(msg) - return self._time_shift(other.n) - - def _add_delta_td(self, other): - assert isinstance(self.freq, Tick) # checked by calling function - assert isinstance(other, (timedelta, np.timedelta64, Tick)) - - delta = self._check_timedeltalike_freq_compat(other) - - # Note: when calling parent class's _add_delta_td, it will call - # delta_to_nanoseconds(delta). Because delta here is an integer, - # delta_to_nanoseconds will return it unchanged. - return DatetimeLikeArrayMixin._add_delta_td(self, delta) - - def _add_delta_tdi(self, other): - assert isinstance(self.freq, Tick) # checked by calling function - - delta = self._check_timedeltalike_freq_compat(other) - return self._addsub_int_array(delta, operator.add) - - def _add_delta(self, other): - """ - Add a timedelta-like, Tick, or TimedeltaIndex-like object - to self. 
- - Parameters - ---------- - other : {timedelta, np.timedelta64, Tick, - TimedeltaIndex, ndarray[timedelta64]} - - Returns - ------- - result : same type as self - """ - if not isinstance(self.freq, Tick): - # We cannot add timedelta-like to non-tick PeriodArray - raise IncompatibleFrequency("Input has different freq from " - "{cls}(freq={freqstr})" - .format(cls=type(self).__name__, - freqstr=self.freqstr)) - - # TODO: standardize across datetimelike subclasses whether to return - # i8 view or _shallow_copy - if isinstance(other, (Tick, timedelta, np.timedelta64)): - new_values = self._add_delta_td(other) - return self._shallow_copy(new_values) - elif is_timedelta64_dtype(other): - # ndarray[timedelta64] or TimedeltaArray/index - new_values = self._add_delta_tdi(other) - return self._shallow_copy(new_values) - else: # pragma: no cover - raise TypeError(type(other).__name__) - - @deprecate_kwarg(old_arg_name='n', new_arg_name='periods') - def shift(self, periods): - """ - Shift index by desired number of increments. - - This method is for shifting the values of period indexes - by a specified time increment. - - Parameters - ---------- - periods : int - Number of periods (or increments) to shift by, - can be positive or negative. - - .. versionchanged:: 0.24.0 - - Returns - ------- - pandas.PeriodIndex - Shifted index. - - See Also - -------- - DatetimeIndex.shift : Shift values of DatetimeIndex. - """ - return self._time_shift(periods) - - def _time_shift(self, n): - values = self._ndarray_values + n * self.freq.n - if self.hasnans: - values[self._isnan] = iNaT - return self._shallow_copy(values=values) - def _maybe_convert_timedelta(self, other): """ Convert timedelta-like input to an integer multiple of self.freq @@ -489,6 +648,29 @@ def _maybe_convert_timedelta(self, other): raise IncompatibleFrequency(msg.format(cls=type(self).__name__, freqstr=self.freqstr)) + # ------------------------------------------------------------------ + # Formatting + def _format_native_types(self, na_rep=u'NaT', date_format=None, + **kwargs): + """ actually format my specific types """ + # TODO(DatetimeArray): remove + values = self.astype(object) + + if date_format: + formatter = lambda dt: dt.strftime(date_format) + else: + formatter = lambda dt: u'%s' % dt + + if self.hasnans: + mask = self._isnan + values[mask] = na_rep + imask = ~mask + values[imask] = np.array([formatter(dt) for dt + in values[imask]]) + else: + values = np.array([formatter(dt) for dt in values]) + return values + def _check_timedeltalike_freq_compat(self, other): """ Arithmetic operations with timedelta-like scalars or array `other` @@ -541,21 +723,298 @@ def _check_timedeltalike_freq_compat(self, other): .format(cls=type(self).__name__, freqstr=self.freqstr)) + def repeat(self, repeats, *args, **kwargs): + """ + Repeat elements of a Categorical. + + See also + -------- + numpy.ndarray.repeat + """ + # TODO(DatetimeArray): remove + nv.validate_repeat(args, kwargs) + values = self._data.repeat(repeats) + return type(self)(values, self.freq) + + # Delegation... + def strftime(self, date_format): + return self._format_native_types(date_format=date_format) + + def astype(self, dtype, copy=True): + # TODO: Figure out something better here... + # We have DatetimeLikeArrayMixin -> + # super(...), which ends up being... DatetimeIndexOpsMixin? + # this is complicated. + # need a pandas_astype(arr, dtype). 
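+        # Behavior sketch (illustrative comment, not part of the change
+        # itself): given arr = period_array(['2000', '2001'], freq='A'),
+        #   arr.astype(object)       -> ndarray of Period objects
+        #   arr.astype('int64')      -> the underlying ordinals
+        #   arr.astype('period[M]')  -> PeriodArray via self.asfreq('M')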
+ from pandas import Categorical + + dtype = pandas_dtype(dtype) + + if is_object_dtype(dtype): + return np.asarray(self, dtype=object) + elif is_string_dtype(dtype) and not is_categorical_dtype(dtype): + return self._format_native_types() + elif is_integer_dtype(dtype): + values = self._data + + if values.dtype != dtype: + # int32 vs. int64 + values = values.astype(dtype) + + elif copy: + values = values.copy() + + return values + elif (is_datetime_or_timedelta_dtype(dtype) and + not is_dtype_equal(self.dtype, dtype)) or is_float_dtype(dtype): + # disallow conversion between datetime/timedelta, + # and conversions for any datetimelike to float + msg = 'Cannot cast {name} to dtype {dtype}' + raise TypeError(msg.format(name=type(self).__name__, dtype=dtype)) + elif is_categorical_dtype(dtype): + return Categorical(self, dtype=dtype) + elif is_period_dtype(dtype): + return self.asfreq(dtype.freq) + else: + return np.asarray(self, dtype=dtype) + + @property + def flags(self): + # TODO: remove + # We need this since reduction.SeriesBinGrouper uses values.flags + # Ideally, we wouldn't be passing objects down there in the first + # place. + return self._data.flags + + # ------------------------------------------------------------------ + # Arithmetic Methods + _create_comparison_method = classmethod(_period_array_cmp) + + def _sub_datelike(self, other): + assert other is not NaT + return NotImplemented + + def _sub_period(self, other): + # If the operation is well-defined, we return an object-Index + # of DateOffsets. Null entries are filled with pd.NaT + if self.freq != other.freq: + msg = DIFFERENT_FREQ_INDEX.format(self.freqstr, other.freqstr) + raise IncompatibleFrequency(msg) + + asi8 = self.asi8 + new_data = asi8 - other.ordinal + new_data = np.array([self.freq * x for x in new_data]) + + if self.hasnans: + new_data[self._isnan] = NaT -PeriodArrayMixin._add_comparison_ops() -PeriodArrayMixin._add_datetimelike_methods() + return new_data + + def _addsub_int_array( + self, + other, # type: Union[Index, ExtensionArray, np.ndarray[int]] + op, # type: Callable[Any, Any] + ): + # type: (...) -> PeriodArray + assert op in [operator.add, operator.sub] + # easy case for PeriodIndex + if op is operator.sub: + other = -other + res_values = algos.checked_add_with_arr(self.asi8, other, + arr_mask=self._isnan) + res_values = res_values.view('i8') + res_values[self._isnan] = iNaT + return type(self)(res_values, freq=self.freq) + + def _add_offset(self, other): + assert not isinstance(other, Tick) + base = frequencies.get_base_alias(other.rule_code) + if base != self.freq.rule_code: + msg = DIFFERENT_FREQ_INDEX.format(self.freqstr, other.freqstr) + raise IncompatibleFrequency(msg) + return self._time_shift(other.n) + + def _add_delta_td(self, other): + assert isinstance(self.freq, Tick) # checked by calling function + assert isinstance(other, (timedelta, np.timedelta64, Tick)) + + delta = self._check_timedeltalike_freq_compat(other) + + # Note: when calling parent class's _add_delta_td, it will call + # delta_to_nanoseconds(delta). Because delta here is an integer, + # delta_to_nanoseconds will return it unchanged. 
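+        # Example (illustrative): with freq='D' (a Tick),
+        # _check_timedeltalike_freq_compat(Timedelta(days=2)) returns 2,
+        # so the ordinals below are shifted by 2. A delta that is not an
+        # integer multiple of the freq raises IncompatibleFrequency.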
+ ordinals = super(PeriodArray, self)._add_delta_td(delta) + return type(self)(ordinals, self.freq) + + def _add_delta_tdi(self, other): + assert isinstance(self.freq, Tick) # checked by calling function + + delta = self._check_timedeltalike_freq_compat(other) + return self._addsub_int_array(delta, operator.add) + + def _add_delta(self, other): + """ + Add a timedelta-like, Tick, or TimedeltaIndex-like object + to self. + + Parameters + ---------- + other : {timedelta, np.timedelta64, Tick, + TimedeltaIndex, ndarray[timedelta64]} + + Returns + ------- + result : same type as self + """ + if not isinstance(self.freq, Tick): + # We cannot add timedelta-like to non-tick PeriodArray + raise IncompatibleFrequency("Input has different freq from " + "{cls}(freq={freqstr})" + .format(cls=type(self).__name__, + freqstr=self.freqstr)) + + # TODO: standardize across datetimelike subclasses whether to return + # i8 view or _shallow_copy + if isinstance(other, (Tick, timedelta, np.timedelta64)): + return self._add_delta_td(other) + elif is_timedelta64_dtype(other): + # ndarray[timedelta64] or TimedeltaArray/index + return self._add_delta_tdi(other) + else: # pragma: no cover + raise TypeError(type(other).__name__) + + +PeriodArray._add_comparison_ops() +PeriodArray._add_datetimelike_methods() # ------------------------------------------------------------------- # Constructor Helpers +def period_array(data, freq=None, copy=False): + # type: (Sequence[Optional[Period]], Optional[Tick]) -> PeriodArray + """ + Construct a new PeriodArray from a sequence of Period scalars. + + Parameters + ---------- + data : Sequence of Period objects + A sequence of Period objects. These are required to all have + the same ``freq.`` Missing values can be indicated by ``None`` + or ``pandas.NaT``. + freq : str, Tick, or Offset + The frequency of every element of the array. This can be specified + to avoid inferring the `freq` from `data`. + copy : bool, default False + Whether to ensure a copy of the data is made. + + Returns + ------- + PeriodArray + + See Also + -------- + PeriodArray + pandas.PeriodIndex + + Examples + -------- + >>> period_array([pd.Period('2017', freq='A'), + ... pd.Period('2018', freq='A')]) + + ['2017', '2018'] + Length: 2, dtype: period[A-DEC] + + >>> period_array([pd.Period('2017', freq='A'), + ... pd.Period('2018', freq='A'), + ... pd.NaT]) + + ['2017', '2018', 'NaT'] + Length: 3, dtype: period[A-DEC] + + Integers that look like years are handled + + >>> period_array([2000, 2001, 2002], freq='D') + ['2000-01-01', '2001-01-01', '2002-01-01'] + Length: 3, dtype: period[D] + + Datetime-like strings may also be passed + + >>> period_array(['2000-Q1', '2000-Q2', '2000-Q3', '2000-Q4'], freq='Q') + + ['2000Q1', '2000Q2', '2000Q3', '2000Q4'] + Length: 4, dtype: period[Q-DEC] + """ + if is_datetime64_dtype(data): + return PeriodArray._from_datetime64(data, freq) + if isinstance(data, (ABCPeriodIndex, ABCSeries, PeriodArray)): + return PeriodArray(data, freq) + + # other iterable of some kind + if not isinstance(data, (np.ndarray, list, tuple)): + data = list(data) + + data = np.asarray(data) + + if freq: + dtype = PeriodDtype(freq) + else: + dtype = None + + if is_float_dtype(data) and len(data) > 0: + raise TypeError("PeriodIndex does not allow " + "floating point in construction") + + data = ensure_object(data) + + return PeriodArray._from_sequence(data, dtype=dtype) + + def dt64arr_to_periodarr(data, freq, tz=None): + """ + Convert an datetime-like array to values Period ordinals. 
+ + Parameters + ---------- + data : Union[Series[datetime64[ns]], DatetimeIndex, ndarray[datetime64ns]] + freq : Optional[Union[str, Tick]] + Must match the `freq` on the `data` if `data` is a DatetimeIndex + or Series. + tz : Optional[tzinfo] + + Returns + ------- + ordinals : ndarray[int] + freq : Tick + The frequencey extracted from the Series or DatetimeIndex if that's + used. + + """ if data.dtype != np.dtype('M8[ns]'): raise ValueError('Wrong dtype: %s' % data.dtype) - freq = Period._maybe_convert_freq(freq) + if freq is not None: + freq = Period._maybe_convert_freq(freq) + + if isinstance(data, ABCIndexClass): + if freq is None: + freq = data.freq + elif freq != data.freq: + msg = DIFFERENT_FREQ_INDEX.format(freq.freqstr, data.freq.freqstr) + raise IncompatibleFrequency(msg) + data = data._values + + elif isinstance(data, ABCSeries): + if freq is None: + freq = data.dt.freq + elif freq != data.dt.freq: + msg = DIFFERENT_FREQ_INDEX.format(freq.freqstr, + data.dt.freq.freqstr) + raise IncompatibleFrequency(msg) + data = data._values + base, mult = frequencies.get_freq_code(freq) - return libperiod.dt64arr_to_periodarr(data.view('i8'), base, tz) + return libperiod.dt64arr_to_periodarr(data.view('i8'), base, tz), freq def _get_ordinal_range(start, end, periods, freq, mult=1): diff --git a/pandas/core/dtypes/common.py b/pandas/core/dtypes/common.py index af5e1523c7cec..da26c2ef74b41 100644 --- a/pandas/core/dtypes/common.py +++ b/pandas/core/dtypes/common.py @@ -14,7 +14,7 @@ from pandas.core.dtypes.generic import ( ABCCategorical, ABCPeriodIndex, ABCDatetimeIndex, ABCSeries, ABCSparseArray, ABCSparseSeries, ABCCategoricalIndex, ABCIndexClass, - ABCDateOffset) + ABCDateOffset, ABCPeriodArray) from pandas.core.dtypes.inference import ( # noqa:F401 is_bool, is_integer, is_float, is_number, is_decimal, is_complex, is_re, is_re_compilable, is_dict_like, is_string_like, is_file_like, @@ -638,10 +638,10 @@ def is_period_arraylike(arr): True """ - if isinstance(arr, ABCPeriodIndex): + if isinstance(arr, (ABCPeriodIndex, ABCPeriodArray)): return True elif isinstance(arr, (np.ndarray, ABCSeries)): - return arr.dtype == object and lib.infer_dtype(arr) == 'period' + return is_period_dtype(arr.dtype) return getattr(arr, 'inferred_type', None) == 'period' diff --git a/pandas/core/dtypes/concat.py b/pandas/core/dtypes/concat.py index df67afd406d06..702a0246a95dd 100644 --- a/pandas/core/dtypes/concat.py +++ b/pandas/core/dtypes/concat.py @@ -470,10 +470,10 @@ def _concat_datetime(to_concat, axis=0, typs=None): axis=axis).view(_TD_DTYPE) elif any(typ.startswith('period') for typ in typs): - # PeriodIndex must be handled by PeriodIndex, - # Thus can't meet this condition ATM - # Must be changed when we adding PeriodDtype - raise NotImplementedError("unable to concat PeriodDtype") + assert len(typs) == 1 + cls = to_concat[0] + new_values = cls._concat_same_type(to_concat) + return new_values def _convert_datetimelike_to_object(x): diff --git a/pandas/core/dtypes/dtypes.py b/pandas/core/dtypes/dtypes.py index f07fb3cd80eab..961c8f1dbe537 100644 --- a/pandas/core/dtypes/dtypes.py +++ b/pandas/core/dtypes/dtypes.py @@ -588,7 +588,7 @@ def __eq__(self, other): str(self.tz) == str(other.tz)) -class PeriodDtype(PandasExtensionDtype): +class PeriodDtype(ExtensionDtype, PandasExtensionDtype): """ A Period duck-typed class, suitable for holding a period with freq dtype. 
@@ -706,6 +706,12 @@ def is_dtype(cls, dtype): return False return super(PeriodDtype, cls).is_dtype(dtype) + @classmethod + def construct_array_type(cls): + from pandas.core.arrays import PeriodArray + + return PeriodArray + @register_extension_dtype class IntervalDtype(PandasExtensionDtype, ExtensionDtype): diff --git a/pandas/core/dtypes/generic.py b/pandas/core/dtypes/generic.py index cb54c94d29205..f6926a192a724 100644 --- a/pandas/core/dtypes/generic.py +++ b/pandas/core/dtypes/generic.py @@ -53,12 +53,17 @@ def _check(cls, inst): ('sparse_array', 'sparse_series')) ABCCategorical = create_pandas_abc_type("ABCCategorical", "_typ", ("categorical")) +ABCPeriodArray = create_pandas_abc_type("ABCPeriodArray", "_typ", + ("periodarray", )) ABCPeriod = create_pandas_abc_type("ABCPeriod", "_typ", ("period", )) ABCDateOffset = create_pandas_abc_type("ABCDateOffset", "_typ", ("dateoffset",)) ABCInterval = create_pandas_abc_type("ABCInterval", "_typ", ("interval", )) ABCExtensionArray = create_pandas_abc_type("ABCExtensionArray", "_typ", - ("extension", "categorical",)) + ("extension", + "categorical", + "periodarray", + )) class _ABCGeneric(type): diff --git a/pandas/core/dtypes/missing.py b/pandas/core/dtypes/missing.py index e48d09ae9a96a..1800c32add9b1 100644 --- a/pandas/core/dtypes/missing.py +++ b/pandas/core/dtypes/missing.py @@ -187,10 +187,18 @@ def _use_inf_as_na(key): def _isna_ndarraylike(obj): - values = getattr(obj, 'values', obj) + is_extension = is_extension_array_dtype(obj) + + if not is_extension: + # Avoid accessing `.values` on things like + # PeriodIndex, which may be expensive. + values = getattr(obj, 'values', obj) + else: + values = obj + dtype = values.dtype - if is_extension_array_dtype(obj): + if is_extension: if isinstance(obj, (ABCIndexClass, ABCSeries)): values = obj._values else: diff --git a/pandas/core/indexes/accessors.py b/pandas/core/indexes/accessors.py index a1868980faed3..35b9799579628 100644 --- a/pandas/core/indexes/accessors.py +++ b/pandas/core/indexes/accessors.py @@ -15,7 +15,7 @@ from pandas.core.accessor import PandasDelegate, delegate_names from pandas.core.base import NoNewAttributesMixin, PandasObject from pandas.core.indexes.datetimes import DatetimeIndex -from pandas.core.indexes.period import PeriodIndex +from pandas.core.indexes.period import PeriodArray from pandas.core.indexes.timedeltas import TimedeltaIndex from pandas.core.algorithms import take_1d @@ -46,7 +46,8 @@ def _get_values(self): else: if is_period_arraylike(data): - return PeriodIndex(data, copy=False, name=self.name) + # TODO: use to_period_array + return PeriodArray(data, copy=False) if is_datetime_arraylike(data): return DatetimeIndex(data, copy=False, name=self.name) @@ -270,11 +271,11 @@ def freq(self): return self._get_values().inferred_freq -@delegate_names(delegate=PeriodIndex, - accessors=PeriodIndex._datetimelike_ops, +@delegate_names(delegate=PeriodArray, + accessors=PeriodArray._datetimelike_ops, typ="property") -@delegate_names(delegate=PeriodIndex, - accessors=PeriodIndex._datetimelike_methods, +@delegate_names(delegate=PeriodArray, + accessors=PeriodArray._datetimelike_methods, typ="method") class PeriodProperties(Properties): """ diff --git a/pandas/core/indexes/base.py b/pandas/core/indexes/base.py index e5760f0141efb..e9b0b087179c9 100644 --- a/pandas/core/indexes/base.py +++ b/pandas/core/indexes/base.py @@ -317,6 +317,11 @@ def __new__(cls, data=None, dtype=None, copy=False, name=None, else: return result + elif is_period_dtype(data) and not 
is_object_dtype(dtype): + from pandas import PeriodIndex + result = PeriodIndex(data, copy=copy, name=name, **kwargs) + return result + # extension dtype elif is_extension_array_dtype(data) or is_extension_array_dtype(dtype): data = np.asarray(data) @@ -389,8 +394,7 @@ def __new__(cls, data=None, dtype=None, copy=False, name=None, # maybe coerce to a sub-class from pandas.core.indexes.period import ( PeriodIndex, IncompatibleFrequency) - if isinstance(data, PeriodIndex): - return PeriodIndex(data, copy=copy, name=name, **kwargs) + if is_signed_integer_dtype(data.dtype): from .numeric import Int64Index return Int64Index(data, copy=copy, dtype=dtype, name=name) diff --git a/pandas/core/indexes/datetimelike.py b/pandas/core/indexes/datetimelike.py index 53f8d42f46d55..14325f42ff0d8 100644 --- a/pandas/core/indexes/datetimelike.py +++ b/pandas/core/indexes/datetimelike.py @@ -35,6 +35,7 @@ import pandas.io.formats.printing as printing +from pandas.core.arrays import PeriodArray from pandas.core.arrays.datetimelike import DatetimeLikeArrayMixin from pandas.core.indexes.base import Index, _index_shared_docs from pandas.util._decorators import Appender, cache_readonly @@ -369,6 +370,9 @@ def sort_values(self, return_indexer=False, ascending=True): if not ascending: sorted_values = sorted_values[::-1] + sorted_values = self._maybe_box_as_values(sorted_values, + **attribs) + return self._simple_new(sorted_values, **attribs) @Appender(_index_shared_docs['take'] % _index_doc_kwargs) @@ -685,14 +689,28 @@ def _concat_same_dtype(self, to_concat, name): return _concat._concat_datetimetz(to_concat, name) else: new_data = np.concatenate([c.asi8 for c in to_concat]) + + new_data = self._maybe_box_as_values(new_data, **attribs) return self._simple_new(new_data, **attribs) + def _maybe_box_as_values(self, values, **attribs): + # TODO(DatetimeArray): remove + # This is a temporary shim while PeriodArray is an ExtensoinArray, + # but others are not. When everyone is an ExtensionArray, this can + # be removed. Currently used in + # - sort_values + # - _concat_same_dtype + return values + def astype(self, dtype, copy=True): if is_object_dtype(dtype): return self._box_values_as_index() elif is_string_dtype(dtype) and not is_categorical_dtype(dtype): return Index(self.format(), name=self.name, dtype=object) elif is_integer_dtype(dtype): + # TODO(DatetimeArray): use self._values here. + # Can't use ._values currently, because that returns a + # DatetimeIndex, which throws us in an infinite loop. 
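+            # e.g. (illustrative): pd.date_range('2000', periods=3)
+            # .astype('i8') returns an Index of int64 epoch nanoseconds
+            # through this branch.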
return Index(self.values.astype('i8', copy=copy), name=self.name, dtype='i8') elif (is_datetime_or_timedelta_dtype(dtype) and @@ -727,7 +745,7 @@ def _ensure_datetimelike_to_i8(other, to_utc=False): """ if is_scalar(other) and isna(other): return iNaT - elif isinstance(other, ABCIndexClass): + elif isinstance(other, (PeriodArray, ABCIndexClass)): # convert tz if needed if getattr(other, 'tz', None) is not None: if to_utc: diff --git a/pandas/core/indexes/period.py b/pandas/core/indexes/period.py index ff875c71683ac..d23d56cba98ae 100644 --- a/pandas/core/indexes/period.py +++ b/pandas/core/indexes/period.py @@ -1,61 +1,106 @@ # pylint: disable=E1101,E1103,W0232 from datetime import datetime import numpy as np +import operator import warnings from pandas.core import common as com from pandas.core.dtypes.common import ( is_integer, is_float, + is_float_dtype, is_integer_dtype, - is_scalar, - is_datetime64_dtype, is_datetime64_any_dtype, - is_period_dtype, is_bool_dtype, pandas_dtype, - ensure_object) - -from pandas.tseries.frequencies import get_freq_code as _gfc +) +from pandas.core.accessor import PandasDelegate, delegate_names from pandas.core.indexes.datetimes import DatetimeIndex, Int64Index, Index from pandas.core.indexes.datetimelike import ( - DatelikeOps, DatetimeIndexOpsMixin, - wrap_array_method, wrap_field_accessor) + DatelikeOps, DatetimeIndexOpsMixin, wrap_arithmetic_op +) from pandas.core.tools.datetimes import parse_time_string -from pandas._libs.lib import infer_dtype from pandas._libs import tslib, index as libindex from pandas._libs.tslibs.period import (Period, IncompatibleFrequency, DIFFERENT_FREQ_INDEX) -from pandas._libs.tslibs import resolution, period + +from pandas._libs.tslibs import resolution from pandas.core.algorithms import unique1d -from pandas.core.arrays import datetimelike as dtl -from pandas.core.arrays.period import PeriodArrayMixin, dt64arr_to_periodarr +from pandas.core.dtypes.dtypes import PeriodDtype +from pandas.core.arrays.period import PeriodArray, period_array from pandas.core.base import _shared_docs from pandas.core.indexes.base import _index_shared_docs, ensure_index from pandas import compat -from pandas.util._decorators import Appender, Substitution, cache_readonly +from pandas.util._decorators import ( + Appender, Substitution, cache_readonly, deprecate_kwarg +) import pandas.core.indexes.base as ibase _index_doc_kwargs = dict(ibase._index_doc_kwargs) _index_doc_kwargs.update( dict(target_klass='PeriodIndex or list of Periods')) + +def _wrap_field_accessor(name): + fget = getattr(PeriodArray, name).fget + + def f(self): + result = fget(self) + return Index(result, name=self.name) + + f.__name__ = name + f.__doc__ = fget.__doc__ + return property(f) + # --- Period index sketch def _new_PeriodIndex(cls, **d): # GH13277 for unpickling - if d['data'].dtype == 'int64': - values = d.pop('data') - return cls._from_ordinals(values=values, **d) + values = d.pop('data') + if values.dtype == 'int64': + freq = d.pop('freq', None) + values = PeriodArray(values, freq=freq) + return cls._simple_new(values, **d) + else: + return cls(values, **d) + + +class PeriodDelegateMixin(PandasDelegate): + """ + Delegate from PeriodIndex to PeriodArray. 
+ """ + def _delegate_property_get(self, name, *args, **kwargs): + result = getattr(self._data, name) + box_ops = ( + set(PeriodArray._datetimelike_ops) - set(PeriodArray._bool_ops) + ) + if name in box_ops: + result = Index(result, name=self.name) + return result + + def _delegate_property_set(self, name, value, *args, **kwargs): + setattr(self._data, name, value) + def _delegate_method(self, name, *args, **kwargs): + result = operator.methodcaller(name, *args, **kwargs)(self._data) + return Index(result, name=self.name) -class PeriodIndex(PeriodArrayMixin, DatelikeOps, DatetimeIndexOpsMixin, - Int64Index): + +@delegate_names(PeriodArray, + PeriodArray._datetimelike_ops + ['size', 'asi8', 'shape'], + typ='property') +@delegate_names(PeriodArray, + [x for x in PeriodArray._datetimelike_methods + if x not in {"asfreq", "to_timestamp"}], + typ="method", + overwrite=True) +class PeriodIndex(DatelikeOps, DatetimeIndexOpsMixin, + Int64Index, PeriodDelegateMixin): """ Immutable ndarray holding ordinal values indicating regular periods in time such as particular years, quarters, months, etc. @@ -137,23 +182,16 @@ class PeriodIndex(PeriodArrayMixin, DatelikeOps, DatetimeIndexOpsMixin, _attributes = ['name', 'freq'] # define my properties & methods for delegation - _other_ops = [] - _bool_ops = ['is_leap_year'] - _object_ops = ['start_time', 'end_time', 'freq'] - _field_ops = ['year', 'month', 'day', 'hour', 'minute', 'second', - 'weekofyear', 'weekday', 'week', 'dayofweek', - 'dayofyear', 'quarter', 'qyear', - 'days_in_month', 'daysinmonth'] - _datetimelike_ops = _field_ops + _object_ops + _bool_ops - _datetimelike_methods = ['strftime', 'to_timestamp', 'asfreq'] - _is_numeric_dtype = False _infer_as_myclass = True - _freq = None + _data = None # type: PeriodArray _engine_type = libindex.PeriodEngine + # ------------------------------------------------------------------------ + # Index Constructors + def __new__(cls, data=None, ordinal=None, freq=None, start=None, end=None, periods=None, tz=None, dtype=None, copy=False, name=None, **fields): @@ -168,85 +206,214 @@ def __new__(cls, data=None, ordinal=None, freq=None, start=None, end=None, if name is None and hasattr(data, 'name'): name = data.name - freq = dtl.validate_dtype_freq(dtype, freq) + if data is None and ordinal is None: + # range-based. 
+ if periods is not None: + if is_float(periods): + periods = int(periods) - # coerce freq to freq object, otherwise it can be coerced elementwise - # which is slow - if freq: - freq = Period._maybe_convert_freq(freq) + elif not is_integer(periods): + msg = 'periods must be a number, got {periods}' + raise TypeError(msg.format(periods=periods)) - if data is None: - if ordinal is not None: - data = np.asarray(ordinal, dtype=np.int64) - else: - data, freq = cls._generate_range(start, end, periods, - freq, fields) - return cls._simple_new(data, name=name, freq=freq) - - if isinstance(data, PeriodIndex): - if freq is None or freq == data.freq: # no freq change - freq = data.freq - data = data._ndarray_values + data, freq = PeriodArray._generate_range(start, end, periods, + freq, fields) + data = PeriodArray(data, freq=freq) + else: + if freq is None and dtype is not None: + freq = PeriodDtype(dtype).freq + elif freq and dtype: + freq = PeriodDtype(freq).freq + dtype = PeriodDtype(dtype).freq + + if freq != dtype: + msg = "specified freq and dtype are different" + raise IncompatibleFrequency(msg) + + # PeriodIndex allow PeriodIndex(period_index, freq=different) + # Let's not encourage that kind of behavior in PeriodArray. + + if freq and isinstance(data, cls) and data.freq != freq: + # TODO: We can do some of these with no-copy / coercion? + # e.g. D -> 2D seems to be OK + data = data.asfreq(freq) + + if data is None and ordinal is not None: + # we strangely ignore `ordinal` if data is passed. + ordinal = np.asarray(ordinal, dtype=np.int64) + data = PeriodArray(ordinal, freq) else: - base1, _ = _gfc(data.freq) - base2, _ = _gfc(freq) - data = period.period_asfreq_arr(data._ndarray_values, - base1, base2, 1) - return cls._simple_new(data, name=name, freq=freq) - - # not array / index - if not isinstance(data, (np.ndarray, PeriodIndex, - DatetimeIndex, Int64Index)): - if is_scalar(data): - cls._scalar_data_error(data) - - # other iterable of some kind - if not isinstance(data, (list, tuple)): - data = list(data) - - data = np.asarray(data) - - # datetime other than period - if is_datetime64_dtype(data.dtype): - data = dt64arr_to_periodarr(data, freq, tz) - return cls._simple_new(data, name=name, freq=freq) - - # check not floats - if infer_dtype(data) == 'floating' and len(data) > 0: - raise TypeError("PeriodIndex does not allow " - "floating point in construction") - - # anything else, likely an array of strings or periods - data = ensure_object(data) - freq = freq or period.extract_freq(data) - data = period.extract_ordinals(data, freq) - return cls._simple_new(data, name=name, freq=freq) + # don't pass copy here, since we copy later. + data = period_array(data=data, freq=freq) - @cache_readonly - def _engine(self): - return self._engine_type(lambda: self, len(self)) + if copy: + data = data.copy() + + return cls._simple_new(data, name=name) @classmethod - def _simple_new(cls, values, freq=None, name=None, **kwargs): - result = super(PeriodIndex, cls)._simple_new(values, freq) + def _simple_new(cls, values, name=None, freq=None, **kwargs): + """ + Create a new PeriodIndex. + + Parameters + ---------- + values : PeriodArray, PeriodIndex, Index[int64], ndarray[int64] + Values that can be converted to a PeriodArray without inference + or coercion. + """ + # TODO: raising on floats is tested, but maybe not useful. + # Should the callers know not to pass floats? + # At the very least, I think we can ensure that lists aren't passed. 
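+        # e.g. (illustrative): _simple_new(PeriodArray(np.arange(3),
+        # freq='D')) is the fast path; an ndarray of int64 ordinals is
+        # wrapped in a PeriodArray below, and floats raise TypeError.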
+ if isinstance(values, list): + values = np.asarray(values) + if is_float_dtype(values): + raise TypeError("PeriodIndex._simple_new does not accept floats.") + values = PeriodArray(values, freq=freq) + + if not isinstance(values, PeriodArray): + raise TypeError("PeriodIndex._simple_new only accepts PeriodArray") + result = object.__new__(cls) + result._data = values result.name = name result._reset_identity() return result - def _shallow_copy_with_infer(self, values, **kwargs): + # ------------------------------------------------------------------------ + # Data + @property + def _ndarray_values(self): + return self._data._ndarray_values + + @property + def values(self): + return np.asarray(self) + + @property + def _values(self): + return self._data + + @property + def freq(self): + # TODO(DatetimeArray): remove + # Can't simply use delegate_names since our base class is defining + # freq + return self._data.freq + + @freq.setter + def freq(self, value): + value = Period._maybe_convert_freq(value) + msg = ('Setting {cls}.freq has been deprecated and will be ' + 'removed in a future version; use {cls}.asfreq instead. ' + 'The {cls}.freq setter is not guaranteed to work.') + warnings.warn(msg.format(cls=type(self).__name__), + FutureWarning, stacklevel=2) + # PeriodArray._freq isn't actually mutable. We set the private _freq + # here, but people shouldn't be doing this anyway. + self._data._freq = value + + def _shallow_copy(self, values=None, **kwargs): + # TODO: simplify, figure out type of values + if values is None: + values = self._data + + if isinstance(values, type(self)): + values = values._values + + if not isinstance(values, PeriodArray): + if (isinstance(values, np.ndarray) and + is_integer_dtype(values.dtype)): + values = PeriodArray(values, freq=self.freq) + else: + # in particular, I would like to avoid period_array here. + # Some people seem to be calling use with unexpected types + # Index.difference -> ndarray[Period] + # DatetimelikeIndexOpsMixin.repeat -> ndarray[ordinal] + # I think that once all of Datetime* are EAs, we can simplify + # this quite a bit. + values = period_array(values, freq=self.freq) + + # I don't like overloading shallow_copy with freq changes. + # See if it's used anywhere outside of test_resample_empty_dataframe + attributes = self._get_attributes_dict() + freq = kwargs.pop("freq", None) + if freq: + values = values.asfreq(freq) + attributes.pop("freq", None) + + attributes.update(kwargs) + if not len(values) and 'dtype' not in kwargs: + attributes['dtype'] = self.dtype + return self._simple_new(values, **attributes) + + def _shallow_copy_with_infer(self, values=None, **kwargs): """ we always want to return a PeriodIndex """ return self._shallow_copy(values=values, **kwargs) - def _coerce_scalar_to_index(self, item): - """ - we need to coerce a scalar to a compat for our index type + @property + def _box_func(self): + """Maybe box an ordinal or Period""" + # TODO(DatetimeArray): Avoid double-boxing + # PeriodArray takes care of boxing already, so we need to check + # whether we're given an ordinal or a Period. It seems like some + # places outside of indexes/period.py are calling this _box_func, + # but passing data that's already boxed. 
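+        # e.g. (illustrative): for a daily-freq index, func(10957)
+        # returns Period('2000-01-01', 'D'), while func(Period(...)) and
+        # func(NaT) pass through unchanged.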
+        def func(x):
+            if isinstance(x, Period) or x is tslib.NaT:
+                return x
+            else:
+                return Period._from_ordinal(ordinal=x, freq=self.freq)
+        return func

-    Parameters
-    ----------
-    item : scalar item to coerce
+    def _maybe_box_as_values(self, values, **attribs):
+        """Box an array of ordinals to a PeriodArray
+
+        This is purely for compatibility between PeriodIndex
+        and Datetime/TimedeltaIndex. Once these are all backed by
+        an ExtensionArray, this can be removed.
+        """
-        return PeriodIndex([item], **self._get_attributes_dict())
+        # TODO(DatetimeArray): remove
+        freq = attribs['freq']
+        return PeriodArray(values, freq=freq)
+
+    # ------------------------------------------------------------------------
+    # Dispatch and maybe box. Not done in delegate_names because we box
+    # differently from those (which use Index).
+
+    def asfreq(self, freq=None, how='E'):
+        result = self._data.asfreq(freq=freq, how=how)
+        return self._simple_new(result, name=self.name)
+
+    def _nat_new(self, box=True):
+        # TODO(DatetimeArray): remove this
+        result = self._data._nat_new(box=box)
+        if box:
+            result = self._simple_new(result, name=self.name)
+        return result
+
+    def to_timestamp(self, freq=None, how='start'):
+        from pandas import DatetimeIndex
+        result = self._data.to_timestamp(freq=freq, how=how)
+        return DatetimeIndex._simple_new(result,
+                                         name=self.name,
+                                         freq=result.freq)
+
+    def _format_native_types(self, na_rep=u'NaT', quoting=None, **kwargs):
+        # just dispatch, return ndarray
+        return self._data._format_native_types(na_rep=na_rep,
+                                               quoting=quoting,
+                                               **kwargs)
+
+    def _maybe_convert_timedelta(self, other):
+        # just dispatch; returns an integer count of self.freq units
+        return self._data._maybe_convert_timedelta(other)
+
+    # ------------------------------------------------------------------------
+    # Indexing
+    @cache_readonly
+    def _engine(self):
+        return self._engine_type(lambda: self, len(self))

     @Appender(_index_shared_docs['__contains__'])
     def __contains__(self, key):
@@ -268,9 +435,46 @@ def __contains__(self, key):
     def _int64index(self):
         return Int64Index._simple_new(self.asi8, name=self.name)

-    @property
-    def values(self):
-        return self.astype(object).values
+    # ------------------------------------------------------------------------
+    # Index Methods
+
+    @deprecate_kwarg(old_arg_name='n', new_arg_name='periods')
+    def shift(self, periods):
+        """
+        Shift index by desired number of increments.
+
+        This method is for shifting the values of period indexes
+        by a specified time increment.
+
+        Parameters
+        ----------
+        periods : int
+            Number of periods (or increments) to shift by,
+            can be positive or negative.
+
+        .. versionchanged:: 0.24.0
+
+        Returns
+        -------
+        pandas.PeriodIndex
+            Shifted index.
+
+        See Also
+        --------
+        DatetimeIndex.shift : Shift values of DatetimeIndex.
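+
+        Examples
+        --------
+        A small illustration (values chosen arbitrarily):
+
+        >>> pidx = pd.period_range('2012-01', periods=3, freq='M')
+        >>> pidx.shift(1)
+        PeriodIndex(['2012-02', '2012-03', '2012-04'], dtype='period[M]', freq='M')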
+ """ + i8values = self._data._time_shift(periods) + return self._simple_new(i8values, name=self.name, freq=self.freq) + + def _coerce_scalar_to_index(self, item): + """ + we need to coerce a scalar to a compat for our index type + + Parameters + ---------- + item : scalar item to coerce + """ + return PeriodIndex([item], **self._get_attributes_dict()) def __array__(self, dtype=None): if is_integer_dtype(dtype): @@ -312,16 +516,6 @@ def __array_wrap__(self, result, context=None): # cannot pass _simple_new as it is return type(self)(result, freq=self.freq, name=self.name) - @property - def size(self): - # Avoid materializing self._values - return self._ndarray_values.size - - @property - def shape(self): - # Avoid materializing self._values - return self._ndarray_values.shape - @property def _formatter_func(self): return lambda x: "'%s'" % x @@ -351,14 +545,17 @@ def asof_locs(self, where, mask): @Appender(_index_shared_docs['astype']) def astype(self, dtype, copy=True, how='start'): dtype = pandas_dtype(dtype) - if is_integer_dtype(dtype): - return self._int64index.copy() if copy else self._int64index - elif is_datetime64_any_dtype(dtype): + + # We have a few special-cases for `dtype`. + # Failing those, we fall back to astyping the values + + if is_datetime64_any_dtype(dtype): + # 'how' is index-speicifc, isn't part of the EA interface. tz = getattr(dtype, 'tz', None) return self.to_timestamp(how=how).tz_localize(tz) - elif is_period_dtype(dtype): - return self.asfreq(freq=dtype.freq) - return super(PeriodIndex, self).astype(dtype, copy=copy) + + result = self._data.astype(dtype, copy=copy) + return Index(result, name=self.name, dtype=dtype, copy=False) @Substitution(klass='PeriodIndex') @Appender(_shared_docs['searchsorted']) @@ -391,34 +588,6 @@ def is_full(self): values = self.asi8 return ((values[1:] - values[:-1]) < 2).all() - year = wrap_field_accessor(PeriodArrayMixin.year) - month = wrap_field_accessor(PeriodArrayMixin.month) - day = wrap_field_accessor(PeriodArrayMixin.day) - hour = wrap_field_accessor(PeriodArrayMixin.hour) - minute = wrap_field_accessor(PeriodArrayMixin.minute) - second = wrap_field_accessor(PeriodArrayMixin.second) - weekofyear = wrap_field_accessor(PeriodArrayMixin.week) - week = weekofyear - dayofweek = wrap_field_accessor(PeriodArrayMixin.dayofweek) - weekday = dayofweek - dayofyear = day_of_year = wrap_field_accessor(PeriodArrayMixin.dayofyear) - quarter = wrap_field_accessor(PeriodArrayMixin.quarter) - qyear = wrap_field_accessor(PeriodArrayMixin.qyear) - days_in_month = wrap_field_accessor(PeriodArrayMixin.days_in_month) - daysinmonth = days_in_month - - to_timestamp = wrap_array_method(PeriodArrayMixin.to_timestamp, True) - - @property - @Appender(PeriodArrayMixin.start_time.__doc__) - def start_time(self): - return PeriodArrayMixin.start_time.fget(self) - - @property - @Appender(PeriodArrayMixin.end_time.__doc__) - def end_time(self): - return PeriodArrayMixin.end_time.fget(self) - def _mpl_repr(self): # how to represent ourselves to matplotlib return self.astype(object).values @@ -677,25 +846,6 @@ def _apply_meta(self, rawarr): name=self.name) return rawarr - def _format_native_types(self, na_rep=u'NaT', date_format=None, **kwargs): - - values = self.astype(object).values - - if date_format: - formatter = lambda dt: dt.strftime(date_format) - else: - formatter = lambda dt: u'%s' % dt - - if self.hasnans: - mask = self._isnan - values[mask] = na_rep - imask = ~mask - values[imask] = np.array([formatter(dt) for dt - in values[imask]]) - else: - values = 
np.array([formatter(dt) for dt in values]) - return values - def __setstate__(self, state): """Necessary for making this object picklable""" @@ -711,12 +861,14 @@ def __setstate__(self, state): np.ndarray.__setstate__(data, nd_state) # backcompat - self._freq = Period._maybe_convert_freq(own_state[1]) + freq = Period._maybe_convert_freq(own_state[1]) else: # pragma: no cover data = np.empty(state) np.ndarray.__setstate__(self, state) + freq = None # ? + data = PeriodArray(data, freq=freq) self._data = data else: @@ -724,6 +876,105 @@ def __setstate__(self, state): _unpickle_compat = __setstate__ + @classmethod + def _add_datetimelike_methods(cls): + """ + add in the datetimelike methods (as we may have to override the + superclass) + """ + # TODO(DatetimeArray): move this up to DatetimeArrayMixin + + def __add__(self, other): + # dispatch to ExtensionArray implementation + result = self._data.__add__(other) + return wrap_arithmetic_op(self, other, result) + + cls.__add__ = __add__ + + def __radd__(self, other): + # alias for __add__ + return self.__add__(other) + cls.__radd__ = __radd__ + + def __sub__(self, other): + # dispatch to ExtensionArray implementation + result = self._data.__sub__(other) + return wrap_arithmetic_op(self, other, result) + + cls.__sub__ = __sub__ + + def __rsub__(self, other): + result = self._data.__rsub__(other) + return wrap_arithmetic_op(self, other, result) + + cls.__rsub__ = __rsub__ + + @classmethod + def _create_comparison_method(cls, op): + """ + Create a comparison method that dispatches to ``cls.values``. + """ + # TODO(DatetimeArray): move to base class. + def wrapper(self, other): + return op(self._data, other) + + wrapper.__doc__ = op.__doc__ + wrapper.__name__ = '__{}__'.format(op.__name__) + return wrapper + + def repeat(self, repeats, *args, **kwargs): + # TODO(DatetimeArray): Just use Index.repeat + return Index.repeat(self, repeats, *args, **kwargs) + + def view(self, dtype=None, type=None): + # TODO(DatetimeArray): remove + if dtype is None or dtype is __builtins__['type'](self): + return self + return self._ndarray_values.view(dtype=dtype) + + @property + def flags(self): + """ return the ndarray.flags for the underlying data """ + warnings.warn("{obj}.flags is deprecated and will be removed " + "in a future version".format(obj=type(self).__name__), + FutureWarning, stacklevel=2) + return self._ndarray_values.flags + + @property + def asi8(self): + # TODO(DatetimeArray): remove + return self.view('i8') + + def item(self): + """ return the first element of the underlying data as a python + scalar + """ + # TODO(DatetimeArray): remove + if len(self) == 1: + return self[0] + else: + # copy numpy's message here because Py26 raises an IndexError + raise ValueError('can only convert an array of size 1 to a ' + 'Python scalar') + + @property + def data(self): + """ return the data pointer of the underlying data """ + warnings.warn("{obj}.data is deprecated and will be removed " + "in a future version".format(obj=type(self).__name__), + FutureWarning, stacklevel=2) + return np.asarray(self._data).data + + @property + def base(self): + """ return the base object if the memory of the underlying data is + shared + """ + warnings.warn("{obj}.base is deprecated and will be removed " + "in a future version".format(obj=type(self).__name__), + FutureWarning, stacklevel=2) + return np.asarray(self._data) + PeriodIndex._add_comparison_ops() PeriodIndex._add_numeric_methods_disabled() diff --git a/pandas/core/series.py b/pandas/core/series.py index 
7ebbe0dfb4bb7..d3ea005d3aae7 100644 --- a/pandas/core/series.py +++ b/pandas/core/series.py @@ -24,7 +24,7 @@ from pandas.compat.numpy import function as nv from pandas.core import base, generic from pandas.core.accessor import CachedAccessor -from pandas.core.arrays import ExtensionArray +from pandas.core.arrays import ExtensionArray, period_array from pandas.core.arrays.categorical import Categorical, CategoricalAccessor from pandas.core.config import get_option from pandas.core.dtypes.cast import ( @@ -135,8 +135,9 @@ class Series(base.IndexOpsMixin, generic.NDFrame): RangeIndex (0, 1, 2, ..., n) if not provided. If both a dict and index sequence are used, the index will override the keys found in the dict. - dtype : numpy.dtype or None - If None, dtype will be inferred + dtype : str, numpy.dtype, or ExtensionDtype, optional + dtype for the output Series. If not specified, this will be + inferred from `data`. copy : boolean, default False Copy input data """ @@ -643,7 +644,8 @@ def __array_prepare__(self, result, context=None): # nice error message for non-ufunc types if (context is not None and - not isinstance(self._values, (np.ndarray, ABCSparseArray))): + (not isinstance(self._values, (np.ndarray, ExtensionArray)) + or isinstance(self._values, Categorical))): obj = context[1][0] raise TypeError("{obj} with dtype {dtype} cannot perform " "the numpy op {op}".format( @@ -4357,4 +4359,12 @@ def _try_cast(arr, take_fast_path): data = np.array(data, dtype=dtype, copy=False) subarr = np.array(data, dtype=object, copy=copy) + if is_object_dtype(subarr.dtype) and dtype != 'object': + inferred = lib.infer_dtype(subarr) + if inferred == 'period': + try: + subarr = period_array(subarr) + except tslibs.period.IncompatibleFrequency: + pass + return subarr diff --git a/pandas/io/packers.py b/pandas/io/packers.py index 73b9e1dfc24e7..764e27a60abb5 100644 --- a/pandas/io/packers.py +++ b/pandas/io/packers.py @@ -53,7 +53,7 @@ ) from pandas.compat import u, u_safe from pandas.core import internals -from pandas.core.arrays import IntervalArray +from pandas.core.arrays import IntervalArray, PeriodArray from pandas.core.arrays.sparse import BlockIndex, IntIndex from pandas.core.dtypes.common import ( is_categorical_dtype, is_object_dtype, needs_i8_conversion, pandas_dtype @@ -599,7 +599,9 @@ def decode(obj): elif typ == u'period_index': data = unconvert(obj[u'data'], np.int64, obj.get(u'compress')) d = dict(name=obj[u'name'], freq=obj[u'freq']) - return globals()[obj[u'klass']]._from_ordinals(data, **d) + freq = d.pop('freq', None) + return globals()[obj[u'klass']](PeriodArray(data, freq), **d) + elif typ == u'datetime_index': data = unconvert(obj[u'data'], np.int64, obj.get(u'compress')) d = dict(name=obj[u'name'], freq=obj[u'freq'], verify_integrity=False) diff --git a/pandas/tests/arithmetic/test_period.py b/pandas/tests/arithmetic/test_period.py index 4ccebd4305b90..cff2c25231220 100644 --- a/pandas/tests/arithmetic/test_period.py +++ b/pandas/tests/arithmetic/test_period.py @@ -270,8 +270,8 @@ def test_ops_frame_period(self): pd.Period('2015-02', freq='M')], 'B': [pd.Period('2014-01', freq='M'), pd.Period('2014-02', freq='M')]}) - assert df['A'].dtype == object - assert df['B'].dtype == object + assert df['A'].dtype == 'Period[M]' + assert df['B'].dtype == 'Period[M]' p = pd.Period('2015-03', freq='M') off = p.freq @@ -285,8 +285,8 @@ def test_ops_frame_period(self): pd.Period('2015-06', freq='M')], 'B': [pd.Period('2015-05', freq='M'), pd.Period('2015-06', freq='M')]}) - assert df2['A'].dtype == 
object - assert df2['B'].dtype == object + assert df2['A'].dtype == 'Period[M]' + assert df2['B'].dtype == 'Period[M]' exp = pd.DataFrame({'A': np.array([4 * off, 4 * off], dtype=object), 'B': np.array([16 * off, 16 * off], dtype=object)}) @@ -642,7 +642,7 @@ def test_pi_sub_isub_timedeltalike_daily(self, three_days): def test_pi_add_sub_timedeltalike_freq_mismatch_daily(self, not_daily): other = not_daily rng = pd.period_range('2014-05-01', '2014-05-15', freq='D') - msg = 'Input has different freq(=.+)? from PeriodIndex\\(freq=D\\)' + msg = 'Input has different freq(=.+)? from Period.*?\\(freq=D\\)' with tm.assert_raises_regex(period.IncompatibleFrequency, msg): rng + other with tm.assert_raises_regex(period.IncompatibleFrequency, msg): @@ -667,7 +667,7 @@ def test_pi_add_iadd_timedeltalike_hourly(self, two_hours): def test_pi_add_timedeltalike_mismatched_freq_hourly(self, not_hourly): other = not_hourly rng = pd.period_range('2014-01-01 10:00', '2014-01-05 10:00', freq='H') - msg = 'Input has different freq(=.+)? from PeriodIndex\\(freq=H\\)' + msg = 'Input has different freq(=.+)? from Period.*?\\(freq=H\\)' with tm.assert_raises_regex(period.IncompatibleFrequency, msg): rng + other @@ -702,7 +702,7 @@ def test_pi_add_sub_timedeltalike_freq_mismatch_annual(self, other = mismatched_freq rng = pd.period_range('2014', '2024', freq='A') msg = ('Input has different freq(=.+)? ' - 'from PeriodIndex\\(freq=A-DEC\\)') + 'from Period.*?\\(freq=A-DEC\\)') with tm.assert_raises_regex(period.IncompatibleFrequency, msg): rng + other with tm.assert_raises_regex(period.IncompatibleFrequency, msg): @@ -726,7 +726,7 @@ def test_pi_add_sub_timedeltalike_freq_mismatch_monthly(self, mismatched_freq): other = mismatched_freq rng = pd.period_range('2014-01', '2016-12', freq='M') - msg = 'Input has different freq(=.+)? from PeriodIndex\\(freq=M\\)' + msg = 'Input has different freq(=.+)? 
from Period.*?\\(freq=M\\)' with tm.assert_raises_regex(period.IncompatibleFrequency, msg): rng + other with tm.assert_raises_regex(period.IncompatibleFrequency, msg): @@ -742,7 +742,7 @@ def test_ops_series_timedelta(self): # GH 13043 ser = pd.Series([pd.Period('2015-01-01', freq='D'), pd.Period('2015-01-02', freq='D')], name='xxx') - assert ser.dtype == object + assert ser.dtype == 'Period[D]' expected = pd.Series([pd.Period('2015-01-02', freq='D'), pd.Period('2015-01-03', freq='D')], name='xxx') @@ -763,7 +763,7 @@ def test_ops_series_period(self): # GH 13043 ser = pd.Series([pd.Period('2015-01-01', freq='D'), pd.Period('2015-01-02', freq='D')], name='xxx') - assert ser.dtype == object + assert ser.dtype == "Period[D]" per = pd.Period('2015-01-10', freq='D') off = per.freq @@ -774,7 +774,7 @@ def test_ops_series_period(self): s2 = pd.Series([pd.Period('2015-01-05', freq='D'), pd.Period('2015-01-04', freq='D')], name='xxx') - assert s2.dtype == object + assert s2.dtype == "Period[D]" expected = pd.Series([4 * off, 2 * off], name='xxx', dtype=object) tm.assert_series_equal(s2 - ser, expected) @@ -916,9 +916,8 @@ def test_pi_offset_errors(self): # Series op is applied per Period instance, thus error is raised # from Period - msg_idx = r"Input has different freq from PeriodIndex\(freq=D\)" - msg_s = r"Input cannot be converted to Period\(freq=D\)" - for obj, msg in [(idx, msg_idx), (ser, msg_s)]: + msg = r"Input has different freq from Period.*?\(freq=D\)" + for obj in [idx, ser]: with tm.assert_raises_regex(period.IncompatibleFrequency, msg): obj + pd.offsets.Hour(2) diff --git a/pandas/tests/arrays/test_datetimelike.py b/pandas/tests/arrays/test_datetimelike.py index d0099aed00285..8baf53e65ba22 100644 --- a/pandas/tests/arrays/test_datetimelike.py +++ b/pandas/tests/arrays/test_datetimelike.py @@ -7,7 +7,7 @@ from pandas.core.arrays import (DatetimeArrayMixin, TimedeltaArrayMixin, - PeriodArrayMixin) + PeriodArray) # TODO: more freq variants @@ -100,7 +100,7 @@ def test_to_period(self, datetime_index, freqstr): expected = dti.to_period(freq=freqstr) result = arr.to_period(freq=freqstr) - assert isinstance(result, PeriodArrayMixin) + assert isinstance(result, PeriodArray) # placeholder until these become actual EA subclasses and we can use # an EA-specific tm.assert_ function @@ -181,7 +181,7 @@ class TestPeriodArray(object): def test_from_pi(self, period_index): pi = period_index - arr = PeriodArrayMixin(pi) + arr = PeriodArray(pi) assert list(arr) == list(pi) # Check that Index.__new__ knows what to do with PeriodArray @@ -191,7 +191,7 @@ def test_from_pi(self, period_index): def test_astype_object(self, period_index): pi = period_index - arr = PeriodArrayMixin(pi) + arr = PeriodArray(pi) asobj = arr.astype('O') assert isinstance(asobj, np.ndarray) assert asobj.dtype == 'O' @@ -200,7 +200,7 @@ def test_astype_object(self, period_index): @pytest.mark.parametrize('how', ['S', 'E']) def test_to_timestamp(self, how, period_index): pi = period_index - arr = PeriodArrayMixin(pi) + arr = PeriodArray(pi) expected = DatetimeArrayMixin(pi.to_timestamp(how=how)) result = arr.to_timestamp(how=how) @@ -210,21 +210,21 @@ def test_to_timestamp(self, how, period_index): # an EA-specific tm.assert_ function tm.assert_index_equal(pd.Index(result), pd.Index(expected)) - @pytest.mark.parametrize('propname', pd.PeriodIndex._bool_ops) + @pytest.mark.parametrize('propname', PeriodArray._bool_ops) def test_bool_properties(self, period_index, propname): # in this case _bool_ops is just `is_leap_year` pi = 
period_index
-        arr = PeriodArrayMixin(pi)
+        arr = PeriodArray(pi)

         result = getattr(arr, propname)
         expected = np.array(getattr(pi, propname))

         tm.assert_numpy_array_equal(result, expected)

-    @pytest.mark.parametrize('propname', pd.PeriodIndex._field_ops)
+    @pytest.mark.parametrize('propname', PeriodArray._field_ops)
     def test_int_properties(self, period_index, propname):
         pi = period_index
-        arr = PeriodArrayMixin(pi)
+        arr = PeriodArray(pi)

         result = getattr(arr, propname)
         expected = np.array(getattr(pi, propname))
diff --git a/pandas/tests/arrays/test_period.py b/pandas/tests/arrays/test_period.py
new file mode 100644
index 0000000000000..780df579d2778
--- /dev/null
+++ b/pandas/tests/arrays/test_period.py
@@ -0,0 +1,206 @@
+import numpy as np
+import pytest
+
+import pandas as pd
+import pandas.util.testing as tm
+from pandas._libs.tslibs import iNaT
+from pandas._libs.tslibs.period import IncompatibleFrequency
+from pandas.core.arrays import PeriodArray, period_array
+from pandas.core.dtypes.common import pandas_dtype
+from pandas.core.dtypes.dtypes import PeriodDtype
+
+# ----------------------------------------------------------------------------
+# Constructors
+
+# period_array
+
+
+@pytest.mark.parametrize("data, freq, expected", [
+    ([pd.Period("2017", "D")], None, [17167]),
+    ([pd.Period("2017", "D")], "D", [17167]),
+    ([2017], "D", [17167]),
+    (["2017"], "D", [17167]),
+    ([pd.Period("2017", "D")], pd.tseries.offsets.Day(), [17167]),
+    ([pd.Period("2017", "D"), None], None, [17167, iNaT]),
+    (pd.Series(pd.date_range("2017", periods=3)), None,
+     [17167, 17168, 17169]),
+    (pd.date_range("2017", periods=3), None, [17167, 17168, 17169]),
+])
+def test_period_array_ok(data, freq, expected):
+    result = period_array(data, freq=freq).asi8
+    expected = np.asarray(expected, dtype=np.int64)
+    tm.assert_numpy_array_equal(result, expected)
+
+
+def test_from_datetime64_raises():
+    arr = pd.date_range("2017", periods=3, freq="D")
+    with tm.assert_raises_regex(IncompatibleFrequency, "freq"):
+        PeriodArray._from_datetime64(arr, freq="M")
+
+
+@pytest.mark.parametrize("data, freq, msg", [
+    ([pd.Period('2017', 'D'),
+      pd.Period('2017', 'A')],
+     None,
+     "Input has different freq"),
+    ([pd.Period('2017', 'D')],
+     "A",
+     "Input has different freq"),
+])
+def test_period_array_raises(data, freq, msg):
+    with tm.assert_raises_regex(IncompatibleFrequency, msg):
+        period_array(data, freq)
+
+
+def test_period_array_non_period_series_raises():
+    ser = pd.Series([1, 2, 3])
+    with tm.assert_raises_regex(TypeError, 'dtype'):
+        PeriodArray(ser, freq='D')
+
+
+def test_period_array_freq_mismatch():
+    arr = period_array(['2000', '2001'], freq='D')
+    with tm.assert_raises_regex(IncompatibleFrequency, 'freq'):
+        PeriodArray(arr, freq='M')
+
+    with tm.assert_raises_regex(IncompatibleFrequency, 'freq'):
+        PeriodArray(arr, freq=pd.tseries.offsets.MonthEnd())
+
+
+def test_asi8():
+    result = period_array(['2000', '2001', None], freq='D').asi8
+    expected = np.array([10957, 11323, iNaT])
+    tm.assert_numpy_array_equal(result, expected)
+
+
+def test_take_raises():
+    arr = period_array(['2000', '2001'], freq='D')
+    with tm.assert_raises_regex(IncompatibleFrequency, 'freq'):
+        arr.take([0, -1], allow_fill=True,
+                 fill_value=pd.Period('2000', freq='W'))

+    with tm.assert_raises_regex(ValueError, 'foo'):
+        arr.take([0, -1], allow_fill=True, fill_value='foo')
+
+
+@pytest.mark.parametrize('dtype', [int, np.int32, np.int64])
+def test_astype(dtype):
+    # Need to ensure ordinals are astyped correctly for both
+    # int32 and 64
+    arr = period_array(['2000', '2001', None], freq='D')
+    result = arr.astype(dtype)
+    # need pandas_dtype to handle int32 vs. int64 correctly
+    expected = pandas_dtype(dtype)
+    assert result.dtype == expected
+
+
+def test_astype_copies():
+    arr = period_array(['2000', '2001', None], freq='D')
+    result = arr.astype(np.int64, copy=False)
+    assert result is arr._data
+
+    result = arr.astype(np.int64, copy=True)
+    assert result is not arr._data
+
+
+def test_astype_categorical():
+    arr = period_array(['2000', '2001', '2001', None], freq='D')
+    result = arr.astype('category')
+    categories = pd.PeriodIndex(['2000', '2001'], freq='D')
+    expected = pd.Categorical.from_codes([0, 1, 1, -1], categories=categories)
+    tm.assert_categorical_equal(result, expected)
+
+
+def test_astype_period():
+    arr = period_array(['2000', '2001', None], freq='D')
+    result = arr.astype(PeriodDtype("M"))
+    expected = period_array(['2000', '2001', None], freq='M')
+    tm.assert_period_array_equal(result, expected)
+
+
+@pytest.mark.parametrize('other', [
+    'datetime64[ns]', 'timedelta64[ns]',
+])
+def test_astype_datetime(other):
+    arr = period_array(['2000', '2001', None], freq='D')
+    # slice off the [ns] so that the regex matches.
+    with tm.assert_raises_regex(TypeError, other[:-4]):
+        arr.astype(other)
+
+
+def test_fillna_raises():
+    arr = period_array(['2000', '2001', '2002'], freq='D')
+    with tm.assert_raises_regex(ValueError, 'Length'):
+        arr.fillna(arr[:2])
+
+
+def test_fillna_copies():
+    arr = period_array(['2000', '2001', '2002'], freq='D')
+    result = arr.fillna(pd.Period("2000", "D"))
+    assert result is not arr
+
+
+# ----------------------------------------------------------------------------
+# setitem
+
+@pytest.mark.parametrize('key, value, expected', [
+    ([0], pd.Period("2000", "D"), [10957, 1, 2]),
+    ([0], None, [iNaT, 1, 2]),
+    ([0], np.nan, [iNaT, 1, 2]),
+    ([0, 1, 2], pd.Period("2000", "D"), [10957] * 3),
+    ([0, 1, 2], [pd.Period("2000", "D"),
+                 pd.Period("2001", "D"),
+                 pd.Period("2002", "D")],
+     [10957, 11323, 11688]),
+])
+def test_setitem(key, value, expected):
+    arr = PeriodArray(np.arange(3), freq="D")
+    expected = PeriodArray(expected, freq="D")
+    arr[key] = value
+    tm.assert_period_array_equal(arr, expected)
+
+
+def test_setitem_raises_incompatible_freq():
+    arr = PeriodArray(np.arange(3), freq="D")
+    with tm.assert_raises_regex(IncompatibleFrequency, "freq"):
+        arr[0] = pd.Period("2000", freq="A")
+
+    other = period_array(['2000', '2001'], freq='A')
+    with tm.assert_raises_regex(IncompatibleFrequency, "freq"):
+        arr[[0, 1]] = other
+
+
+def test_setitem_raises_length():
+    arr = PeriodArray(np.arange(3), freq="D")
+    with tm.assert_raises_regex(ValueError, "length"):
+        arr[[0, 1]] = [pd.Period("2000", freq="D")]
+
+
+def test_setitem_raises_type():
+    arr = PeriodArray(np.arange(3), freq="D")
+    with tm.assert_raises_regex(TypeError, "int"):
+        arr[0] = 1
+
+
+# ----------------------------------------------------------------------------
+# Ops
+
+def test_sub_period():
+    arr = period_array(['2000', '2001'], freq='D')
+    other = pd.Period("2000", freq="M")
+    with tm.assert_raises_regex(IncompatibleFrequency, "freq"):
+        arr - other
+
+
+# ----------------------------------------------------------------------------
+# other
+
+def test_maybe_convert_timedelta():
+    arr = period_array(['2000', '2001'], freq='D')
+    offset = pd.tseries.offsets.Day(2)
+    assert arr._maybe_convert_timedelta(offset) == 2
+    assert arr._maybe_convert_timedelta(2) == 2
+
+    offset = pd.tseries.offsets.BusinessDay()
+    with 
tm.assert_raises_regex(ValueError, 'freq'): + arr._maybe_convert_timedelta(offset) diff --git a/pandas/tests/dtypes/test_concat.py b/pandas/tests/dtypes/test_concat.py index b6c5c119ffb6f..35623415571c0 100644 --- a/pandas/tests/dtypes/test_concat.py +++ b/pandas/tests/dtypes/test_concat.py @@ -38,16 +38,14 @@ def test_get_dtype_kinds(klass, to_concat, expected): @pytest.mark.parametrize('to_concat, expected', [ - # because we don't have Period dtype (yet), - # Series results in object dtype ([PeriodIndex(['2011-01'], freq='M'), PeriodIndex(['2011-01'], freq='M')], ['period[M]']), ([Series([Period('2011-01', freq='M')]), - Series([Period('2011-02', freq='M')])], ['object']), + Series([Period('2011-02', freq='M')])], ['period[M]']), ([PeriodIndex(['2011-01'], freq='M'), PeriodIndex(['2011-01'], freq='D')], ['period[M]', 'period[D]']), ([Series([Period('2011-01', freq='M')]), - Series([Period('2011-02', freq='D')])], ['object'])]) + Series([Period('2011-02', freq='D')])], ['period[M]', 'period[D]'])]) def test_get_dtype_kinds_period(to_concat, expected): result = _concat.get_dtype_kinds(to_concat) assert result == set(expected) diff --git a/pandas/tests/dtypes/test_dtypes.py b/pandas/tests/dtypes/test_dtypes.py index c53c2e5059cde..2927442f9b6ee 100644 --- a/pandas/tests/dtypes/test_dtypes.py +++ b/pandas/tests/dtypes/test_dtypes.py @@ -381,11 +381,9 @@ def test_basic(self): assert is_period(pidx) s = Series(pidx, name='A') - # dtypes - # series results in object dtype currently, - # is_period checks period_arraylike - assert not is_period_dtype(s.dtype) - assert not is_period_dtype(s) + + assert is_period_dtype(s.dtype) + assert is_period_dtype(s) assert is_period(s) assert not is_period_dtype(np.dtype('float64')) diff --git a/pandas/tests/extension/test_common.py b/pandas/tests/extension/test_common.py index b6223ea96d7dd..a0a8f86a5d7b5 100644 --- a/pandas/tests/extension/test_common.py +++ b/pandas/tests/extension/test_common.py @@ -78,7 +78,6 @@ def test_astype_no_copy(): @pytest.mark.parametrize('dtype', [ dtypes.DatetimeTZDtype('ns', 'US/Central'), - dtypes.PeriodDtype("D"), ]) def test_is_not_extension_array_dtype(dtype): assert not isinstance(dtype, dtypes.ExtensionDtype) diff --git a/pandas/tests/extension/test_integer.py b/pandas/tests/extension/test_integer.py index 668939e775148..26b09d545378b 100644 --- a/pandas/tests/extension/test_integer.py +++ b/pandas/tests/extension/test_integer.py @@ -143,11 +143,6 @@ def test_error(self, data, all_arithmetic_operators): # other specific errors tested in the integer array specific tests pass - def test_add_series_with_extension_array(self, data): - super(TestArithmeticOps, self).test_add_series_with_extension_array( - data - ) - class TestComparisonOps(base.BaseComparisonOpsTests): diff --git a/pandas/tests/extension/test_period.py b/pandas/tests/extension/test_period.py new file mode 100644 index 0000000000000..6f59cbb66a145 --- /dev/null +++ b/pandas/tests/extension/test_period.py @@ -0,0 +1,155 @@ +import numpy as np +import pytest + +import pandas as pd +import pandas.util.testing as tm +from pandas._libs.tslib import iNaT +from pandas.core.arrays import PeriodArray +from pandas.core.dtypes.dtypes import PeriodDtype +from pandas.tests.extension import base + + +@pytest.fixture +def dtype(): + return PeriodDtype(freq='D') + + +@pytest.fixture +def data(dtype): + return PeriodArray(np.arange(1970, 2070), freq=dtype.freq) + + +@pytest.fixture +def data_for_sorting(dtype): + return PeriodArray([2018, 2019, 2017], freq=dtype.freq) + + 
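+# Note: the integers used in these fixtures (2017, 2018, ...) are raw period
+# ordinals, not years; with the daily freq of the `dtype` fixture they are
+# day counts since 1970-01-01. The tests only rely on their relative
+# ordering and equality, so any distinct integers would do.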
+@pytest.fixture
+def data_missing(dtype):
+    return PeriodArray([iNaT, 2017], freq=dtype.freq)
+
+
+@pytest.fixture
+def data_missing_for_sorting(dtype):
+    return PeriodArray([2018, iNaT, 2017], freq=dtype.freq)
+
+
+@pytest.fixture
+def data_for_grouping(dtype):
+    B = 2018
+    NA = iNaT
+    A = 2017
+    C = 2019
+    return PeriodArray([B, B, NA, NA, A, A, B, C], freq=dtype.freq)
+
+
+@pytest.fixture
+def na_value():
+    return pd.NaT
+
+
+class BasePeriodTests(object):
+    pass
+
+
+class TestPeriodDtype(BasePeriodTests, base.BaseDtypeTests):
+    pass
+
+
+class TestConstructors(BasePeriodTests, base.BaseConstructorsTests):
+    pass
+
+
+class TestGetitem(BasePeriodTests, base.BaseGetitemTests):
+    pass
+
+
+class TestMethods(BasePeriodTests, base.BaseMethodsTests):
+
+    def test_combine_add(self, data_repeated):
+        # Period + Period is not defined.
+        pass
+
+
+class TestInterface(BasePeriodTests, base.BaseInterfaceTests):
+
+    def test_no_values_attribute(self, data):
+        # We have a values attribute.
+        pass
+
+
+class TestArithmeticOps(BasePeriodTests, base.BaseArithmeticOpsTests):
+    implements = {'__sub__', '__rsub__'}
+
+    def test_arith_series_with_scalar(self, data, all_arithmetic_operators):
+        # we implement subtraction...
+        if all_arithmetic_operators in self.implements:
+            s = pd.Series(data)
+            self.check_opname(s, all_arithmetic_operators, s.iloc[0],
+                              exc=None)
+        else:
+            # ... but not the rest.
+            super(TestArithmeticOps, self).test_arith_series_with_scalar(
+                data, all_arithmetic_operators
+            )
+
+    def test_arith_series_with_array(self, data, all_arithmetic_operators):
+        # we implement subtraction...
+        if all_arithmetic_operators in self.implements:
+            s = pd.Series(data)
+            self.check_opname(s, all_arithmetic_operators, s.iloc[0],
+                              exc=None)
+        else:
+            # ... but not the rest.
+            super(TestArithmeticOps, self).test_arith_series_with_array(
+                data, all_arithmetic_operators
+            )
+
+    def _check_divmod_op(self, s, op, other, exc=NotImplementedError):
+        super(TestArithmeticOps, self)._check_divmod_op(
+            s, op, other, exc=TypeError
+        )
+
+    def test_add_series_with_extension_array(self, data):
+        # we don't implement + for Period
+        s = pd.Series(data)
+        msg = (r"unsupported operand type\(s\) for \+: "
+               r"\'PeriodArray\' and \'PeriodArray\'")
+        with tm.assert_raises_regex(TypeError, msg):
+            s + data
+
+    def test_error(self):
+        pass
+
+    def test_direct_arith_with_series_returns_not_implemented(self, data):
+        # Override to use __sub__ instead of __add__
+        other = pd.Series(data)
+        result = data.__sub__(other)
+        assert result is NotImplemented
+
+
+class TestCasting(BasePeriodTests, base.BaseCastingTests):
+    pass
+
+
+class TestComparisonOps(BasePeriodTests, base.BaseComparisonOpsTests):
+
+    def _compare_other(self, s, data, op_name, other):
+        # the base test is not appropriate for us. We raise on comparison
+        # with (some) integers, depending on the value.
+ pass + + +class TestMissing(BasePeriodTests, base.BaseMissingTests): + pass + + +class TestReshaping(BasePeriodTests, base.BaseReshapingTests): + pass + + +class TestSetitem(BasePeriodTests, base.BaseSetitemTests): + pass + + +class TestGroupby(BasePeriodTests, base.BaseGroupbyTests): + pass diff --git a/pandas/tests/frame/test_combine_concat.py b/pandas/tests/frame/test_combine_concat.py index ece9559313ba0..a43c5c7257daa 100644 --- a/pandas/tests/frame/test_combine_concat.py +++ b/pandas/tests/frame/test_combine_concat.py @@ -741,6 +741,7 @@ def test_combine_first_timedelta(self): tm.assert_frame_equal(res, exp) assert res['TD'].dtype == 'timedelta64[ns]' + @pytest.mark.xfail(reason="GH-23079", strict=True) def test_combine_first_period(self): data1 = pd.PeriodIndex(['2011-01', 'NaT', '2011-03', '2011-04'], freq='M') @@ -755,7 +756,7 @@ def test_combine_first_period(self): freq='M') exp = pd.DataFrame({'P': exp_dts}, index=[1, 2, 3, 4, 5, 7]) tm.assert_frame_equal(res, exp) - assert res['P'].dtype == 'object' + assert res['P'].dtype == data1.dtype # different freq dts2 = pd.PeriodIndex(['2012-01-01', '2012-01-02', diff --git a/pandas/tests/frame/test_constructors.py b/pandas/tests/frame/test_constructors.py index 3a45e0b61184c..dbce4c88aefd7 100644 --- a/pandas/tests/frame/test_constructors.py +++ b/pandas/tests/frame/test_constructors.py @@ -582,14 +582,14 @@ def test_constructor_period(self): a = pd.PeriodIndex(['2012-01', 'NaT', '2012-04'], freq='M') b = pd.PeriodIndex(['2012-02-01', '2012-03-01', 'NaT'], freq='D') df = pd.DataFrame({'a': a, 'b': b}) - assert df['a'].dtype == 'object' - assert df['b'].dtype == 'object' + assert df['a'].dtype == a.dtype + assert df['b'].dtype == b.dtype # list of periods df = pd.DataFrame({'a': a.astype(object).tolist(), 'b': b.astype(object).tolist()}) - assert df['a'].dtype == 'object' - assert df['b'].dtype == 'object' + assert df['a'].dtype == a.dtype + assert df['b'].dtype == b.dtype def test_nested_dict_frame_constructor(self): rng = pd.period_range('1/1/2000', periods=5) diff --git a/pandas/tests/frame/test_operators.py b/pandas/tests/frame/test_operators.py index b2781952ea86d..20ca4bc7de43e 100644 --- a/pandas/tests/frame/test_operators.py +++ b/pandas/tests/frame/test_operators.py @@ -552,7 +552,8 @@ def test_arith_non_pandas_object(self): df = self.simple val1 = df.xs('a').values - added = DataFrame(df.values + val1, index=df.index, columns=df.columns) + added = DataFrame(df.values + val1, index=df.index, + columns=df.columns) assert_frame_equal(df + val1, added) added = DataFrame((df.values.T + val1).T, diff --git a/pandas/tests/frame/test_replace.py b/pandas/tests/frame/test_replace.py index 49dba1c769572..bf755b1dac4b8 100644 --- a/pandas/tests/frame/test_replace.py +++ b/pandas/tests/frame/test_replace.py @@ -984,8 +984,11 @@ def test_replace_period(self): 'out_augmented_AUG_2011.json', 'out_augmented_JAN_2011.json'], columns=['fname']) assert set(df.fname.values) == set(d['fname'].keys()) + # We don't support converting object -> specialized EA in + # replace yet. 
expected = DataFrame({'fname': [d['fname'][k] - for k in df.fname.values]}) + for k in df.fname.values]}, + dtype=object) result = df.replace(d) assert_frame_equal(result, expected) diff --git a/pandas/tests/frame/test_reshape.py b/pandas/tests/frame/test_reshape.py index 9f6735c7ba2bf..ed3cc39052183 100644 --- a/pandas/tests/frame/test_reshape.py +++ b/pandas/tests/frame/test_reshape.py @@ -277,6 +277,8 @@ def test_unstack_fill_frame_timedelta(self): index=['x', 'y', 'z']) assert_frame_equal(result, expected) + @pytest.mark.xfail(reason="GH-23077", + strict=True) def test_unstack_fill_frame_period(self): # Test unstacking with period diff --git a/pandas/tests/indexes/common.py b/pandas/tests/indexes/common.py index ee91b3075b0a1..dc936af04e045 100644 --- a/pandas/tests/indexes/common.py +++ b/pandas/tests/indexes/common.py @@ -309,7 +309,8 @@ def test_ensure_copied_data(self): index_type = index.__class__ result = index_type(index.values, copy=True, **init_kwargs) tm.assert_index_equal(index, result) - tm.assert_numpy_array_equal(index.values, result.values, + tm.assert_numpy_array_equal(index._ndarray_values, + result._ndarray_values, check_same='copy') if isinstance(index, PeriodIndex): diff --git a/pandas/tests/indexes/period/test_astype.py b/pandas/tests/indexes/period/test_astype.py index f2126487496c4..a5042b8c714c8 100644 --- a/pandas/tests/indexes/period/test_astype.py +++ b/pandas/tests/indexes/period/test_astype.py @@ -14,7 +14,7 @@ class TestPeriodIndexAsType(object): def test_astype_raises(self, dtype): # GH#13149, GH#13209 idx = PeriodIndex(['2016-05-16', 'NaT', NaT, np.NaN], freq='D') - msg = 'Cannot cast PeriodIndex to dtype' + msg = 'Cannot cast PeriodArray to dtype' with tm.assert_raises_regex(TypeError, msg): idx.astype(dtype) @@ -27,7 +27,7 @@ def test_astype_conversion(self): [Period(NaT, freq='D')] * 3, dtype='object') tm.assert_index_equal(result, expected) - result = idx.astype(int) + result = idx.astype(np.int64) expected = Int64Index([16937] + [-9223372036854775808] * 3, dtype=np.int64) tm.assert_index_equal(result, expected) diff --git a/pandas/tests/indexes/period/test_construction.py b/pandas/tests/indexes/period/test_construction.py index d54dac5867845..e1cefaf5905ad 100644 --- a/pandas/tests/indexes/period/test_construction.py +++ b/pandas/tests/indexes/period/test_construction.py @@ -7,6 +7,7 @@ from pandas.compat import lrange, PY3, text_type, lmap from pandas import (Period, PeriodIndex, period_range, offsets, date_range, Series, Index) +from pandas.core.dtypes.dtypes import PeriodDtype class TestPeriodIndex(object): @@ -270,16 +271,6 @@ def test_constructor_simple_new(self): result = idx._simple_new(idx.astype('i8'), name='p', freq=idx.freq) tm.assert_index_equal(result, idx) - result = idx._simple_new([pd.Period('2007-01', freq='M'), - pd.Period('2007-02', freq='M')], - name='p', freq=idx.freq) - tm.assert_index_equal(result, idx) - - result = idx._simple_new(np.array([pd.Period('2007-01', freq='M'), - pd.Period('2007-02', freq='M')]), - name='p', freq=idx.freq) - tm.assert_index_equal(result, idx) - def test_constructor_simple_new_empty(self): # GH13079 idx = PeriodIndex([], freq='M', name='p') @@ -288,7 +279,6 @@ def test_constructor_simple_new_empty(self): @pytest.mark.parametrize('floats', [[1.1, 2.1], np.array([1.1, 2.1])]) def test_constructor_floats(self, floats): - # GH#13079 with pytest.raises(TypeError): pd.PeriodIndex._simple_new(floats, freq='M') @@ -484,6 +474,7 @@ def test_constructor_cant_cast_period(self): dtype=float) def 
test_constructor_cast_object(self): - s = Series(period_range('1/1/2000', periods=10), dtype=object) + s = Series(period_range('1/1/2000', periods=10), + dtype=PeriodDtype("D")) exp = Series(period_range('1/1/2000', periods=10)) tm.assert_series_equal(s, exp) diff --git a/pandas/tests/indexes/period/test_formats.py b/pandas/tests/indexes/period/test_formats.py index daf44a559cf5c..2a893ae16e30d 100644 --- a/pandas/tests/indexes/period/test_formats.py +++ b/pandas/tests/indexes/period/test_formats.py @@ -116,41 +116,41 @@ def test_representation_to_series(self): idx8 = pd.period_range('2013Q1', periods=2, freq="Q") idx9 = pd.period_range('2013Q1', periods=3, freq="Q") - exp1 = """Series([], dtype: object)""" + exp1 = """Series([], dtype: period[D])""" - exp2 = """0 2011-01-01 -dtype: object""" + exp2 = """0 2011-01-01 +dtype: period[D]""" - exp3 = """0 2011-01-01 -1 2011-01-02 -dtype: object""" + exp3 = """0 2011-01-01 +1 2011-01-02 +dtype: period[D]""" - exp4 = """0 2011-01-01 -1 2011-01-02 -2 2011-01-03 -dtype: object""" + exp4 = """0 2011-01-01 +1 2011-01-02 +2 2011-01-03 +dtype: period[D]""" - exp5 = """0 2011 -1 2012 -2 2013 -dtype: object""" + exp5 = """0 2011 +1 2012 +2 2013 +dtype: period[A-DEC]""" - exp6 = """0 2011-01-01 09:00 -1 2012-02-01 10:00 -2 NaT -dtype: object""" + exp6 = """0 2011-01-01 09:00 +1 2012-02-01 10:00 +2 NaT +dtype: period[H]""" - exp7 = """0 2013Q1 -dtype: object""" + exp7 = """0 2013Q1 +dtype: period[Q-DEC]""" - exp8 = """0 2013Q1 -1 2013Q2 -dtype: object""" + exp8 = """0 2013Q1 +1 2013Q2 +dtype: period[Q-DEC]""" - exp9 = """0 2013Q1 -1 2013Q2 -2 2013Q3 -dtype: object""" + exp9 = """0 2013Q1 +1 2013Q2 +2 2013Q3 +dtype: period[Q-DEC]""" for idx, expected in zip([idx1, idx2, idx3, idx4, idx5, idx6, idx7, idx8, idx9], diff --git a/pandas/tests/indexes/period/test_indexing.py b/pandas/tests/indexes/period/test_indexing.py index 60ba0491f1ffd..609c4a828adec 100644 --- a/pandas/tests/indexes/period/test_indexing.py +++ b/pandas/tests/indexes/period/test_indexing.py @@ -564,7 +564,7 @@ def test_get_loc2(self): 'unit abbreviation w/o a number'): idx.get_loc('2000-01-10', method='nearest', tolerance='foo') - msg = 'Input has different freq from PeriodIndex\\(freq=D\\)' + msg = 'Input has different freq from PeriodArray\\(freq=D\\)' with tm.assert_raises_regex(ValueError, msg): idx.get_loc('2000-01-10', method='nearest', tolerance='1 hour') with pytest.raises(KeyError): @@ -594,7 +594,7 @@ def test_get_indexer2(self): tolerance='1 hour'), np.array([0, -1, 1], dtype=np.intp)) - msg = 'Input has different freq from PeriodIndex\\(freq=H\\)' + msg = 'Input has different freq from PeriodArray\\(freq=H\\)' with tm.assert_raises_regex(ValueError, msg): idx.get_indexer(target, 'nearest', tolerance='1 minute') diff --git a/pandas/tests/indexes/period/test_ops.py b/pandas/tests/indexes/period/test_ops.py index a59efe57f83c4..33858a28ec81b 100644 --- a/pandas/tests/indexes/period/test_ops.py +++ b/pandas/tests/indexes/period/test_ops.py @@ -7,6 +7,7 @@ import pandas.util.testing as tm from pandas import DatetimeIndex, PeriodIndex, Series, Period, Index +from pandas.core.arrays import PeriodArray from pandas.tests.test_base import Ops @@ -21,9 +22,9 @@ def setup_method(self, method): def test_ops_properties(self): f = lambda x: isinstance(x, PeriodIndex) - self.check_ops_properties(PeriodIndex._field_ops, f) - self.check_ops_properties(PeriodIndex._object_ops, f) - self.check_ops_properties(PeriodIndex._bool_ops, f) + self.check_ops_properties(PeriodArray._field_ops, f) + 
self.check_ops_properties(PeriodArray._object_ops, f) + self.check_ops_properties(PeriodArray._bool_ops, f) def test_minmax(self): @@ -92,7 +93,7 @@ def test_value_counts_unique(self): # GH 7735 idx = pd.period_range('2011-01-01 09:00', freq='H', periods=10) # create repeated values, 'n'th element is repeated by n+1 times - idx = PeriodIndex(np.repeat(idx.values, range(1, len(idx) + 1)), + idx = PeriodIndex(np.repeat(idx._values, range(1, len(idx) + 1)), freq='H') exp_idx = PeriodIndex(['2011-01-01 18:00', '2011-01-01 17:00', @@ -390,7 +391,9 @@ def test_equals(self, freq): assert not idx.equals(pd.Series(idx2)) # same internal, different tz - idx3 = pd.PeriodIndex._simple_new(idx.asi8, freq='H') + idx3 = pd.PeriodIndex._simple_new( + idx._values._simple_new(idx._values.asi8, freq="H") + ) tm.assert_numpy_array_equal(idx.asi8, idx3.asi8) assert not idx.equals(idx3) assert not idx.equals(idx3.copy()) @@ -501,3 +504,12 @@ def test_pi_comp_period_nat(self): f = lambda x: tslib.NaT >= x exp = np.array([False, False, False, False], dtype=np.bool) self._check(idx, f, exp) + + +@pytest.mark.parametrize("other", ["2017", 2017]) +def test_eq(other): + idx = pd.PeriodIndex(['2017', '2017', '2018'], freq="D") + expected = np.array([True, True, False]) + result = idx == other + + tm.assert_numpy_array_equal(result, expected) diff --git a/pandas/tests/indexes/period/test_tools.py b/pandas/tests/indexes/period/test_tools.py index a5c58eb40cc0d..a7bd2f370996b 100644 --- a/pandas/tests/indexes/period/test_tools.py +++ b/pandas/tests/indexes/period/test_tools.py @@ -101,6 +101,12 @@ def _get_with_delta(delta, freq='A-DEC'): tm.assert_index_equal(result.index, exp_index) assert result.name == 'foo' + def test_to_timestamp_freq(self): + idx = pd.period_range('2017', periods=12, freq="A-DEC") + result = idx.to_timestamp() + expected = pd.date_range("2017", periods=12, freq="AS-JAN") + tm.assert_index_equal(result, expected) + def test_to_timestamp_repr_is_code(self): zs = [Timestamp('99-04-17 00:00:00', tz='UTC'), Timestamp('2001-04-17 00:00:00', tz='UTC'), diff --git a/pandas/tests/io/formats/test_format.py b/pandas/tests/io/formats/test_format.py index 03e830fb09ad6..28aa8a92cc410 100644 --- a/pandas/tests/io/formats/test_format.py +++ b/pandas/tests/io/formats/test_format.py @@ -1720,9 +1720,11 @@ def test_period(self): pd.Period('2011-03-01 09:00', freq='H'), pd.Period('2011-04', freq='M')], 'C': list('abcd')}) - exp = (" A B C\n0 2013-01 2011-01 a\n" - "1 2013-02 2011-02-01 b\n2 2013-03 2011-03-01 09:00 c\n" - "3 2013-04 2011-04 d") + exp = (" A B C\n" + "0 2013-01 2011-01 a\n" + "1 2013-02 2011-02-01 b\n" + "2 2013-03 2011-03-01 09:00 c\n" + "3 2013-04 2011-04 d") assert str(df) == exp @@ -2110,21 +2112,31 @@ def test_period(self): # GH 12615 index = pd.period_range('2013-01', periods=6, freq='M') s = Series(np.arange(6, dtype='int64'), index=index) - exp = ("2013-01 0\n2013-02 1\n2013-03 2\n2013-04 3\n" - "2013-05 4\n2013-06 5\nFreq: M, dtype: int64") + exp = ("2013-01 0\n" + "2013-02 1\n" + "2013-03 2\n" + "2013-04 3\n" + "2013-05 4\n" + "2013-06 5\n" + "Freq: M, dtype: int64") assert str(s) == exp s = Series(index) - exp = ("0 2013-01\n1 2013-02\n2 2013-03\n3 2013-04\n" - "4 2013-05\n5 2013-06\ndtype: object") + exp = ("0 2013-01\n" + "1 2013-02\n" + "2 2013-03\n" + "3 2013-04\n" + "4 2013-05\n" + "5 2013-06\n" + "dtype: period[M]") assert str(s) == exp # periods with mixed freq s = Series([pd.Period('2011-01', freq='M'), pd.Period('2011-02-01', freq='D'), pd.Period('2011-03-01 09:00', freq='H')]) - 
exp = ("0 2011-01\n1 2011-02-01\n" - "2 2011-03-01 09:00\ndtype: object") + exp = ("0 2011-01\n1 2011-02-01\n" + "2 2011-03-01 09:00\ndtype: object") assert str(s) == exp def test_max_multi_index_display(self): diff --git a/pandas/tests/io/test_feather.py b/pandas/tests/io/test_feather.py index 36118fb1303fc..82f9f7253e65c 100644 --- a/pandas/tests/io/test_feather.py +++ b/pandas/tests/io/test_feather.py @@ -100,7 +100,8 @@ def test_unsupported_other(self): # period df = pd.DataFrame({'a': pd.period_range('2013', freq='M', periods=3)}) - self.check_error_on_write(df, ValueError) + # Some versions raise ValueError, others raise ArrowInvalid. + self.check_error_on_write(df, Exception) @pytest.mark.skipif(fv < LooseVersion('0.4.0'), reason='new in 0.4.0') def test_rw_nthreads(self): diff --git a/pandas/tests/io/test_parquet.py b/pandas/tests/io/test_parquet.py index c92d9a489b5c3..4c58d8ce29d8b 100644 --- a/pandas/tests/io/test_parquet.py +++ b/pandas/tests/io/test_parquet.py @@ -441,7 +441,9 @@ def test_duplicate_columns(self, pa): def test_unsupported(self, pa): # period df = pd.DataFrame({'a': pd.period_range('2013', freq='M', periods=3)}) - self.check_error_on_write(df, pa, ValueError) + # pyarrow 0.11 raises ArrowTypeError + # older pyarrows raise ArrowInvalid + self.check_error_on_write(df, pa, Exception) # timedelta df = pd.DataFrame({'a': pd.timedelta_range('1 day', @@ -450,7 +452,9 @@ def test_unsupported(self, pa): # mixed python objects df = pd.DataFrame({'a': ['a', 1, 2.0]}) - self.check_error_on_write(df, pa, ValueError) + # pyarrow 0.11 raises ArrowTypeError + # older pyarrows raise ArrowInvalid + self.check_error_on_write(df, pa, Exception) def test_categorical(self, pa_ge_070): pa = pa_ge_070 diff --git a/pandas/tests/reshape/merge/test_merge.py b/pandas/tests/reshape/merge/test_merge.py index 50ef622a4147f..2b4a7952ae738 100644 --- a/pandas/tests/reshape/merge/test_merge.py +++ b/pandas/tests/reshape/merge/test_merge.py @@ -666,8 +666,8 @@ def test_merge_on_periods(self): 'value_y': [pd.NaT] + list(exp_y)}) result = pd.merge(left, right, on='key', how='outer') assert_frame_equal(result, expected) - assert result['value_x'].dtype == 'object' - assert result['value_y'].dtype == 'object' + assert result['value_x'].dtype == 'Period[D]' + assert result['value_y'].dtype == 'Period[D]' def test_indicator(self): # PR #10054. xref #7412 and closes #8790. 
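# An illustrative sketch (assuming a pandas build with this PeriodArray
# support) of the behavior the merge tests above pin down: data built from
# Periods of a single freq now carries a period dtype instead of object.
#
#     >>> import pandas as pd
#     >>> s = pd.Series(pd.period_range('2000-01-01', periods=2, freq='D'))
#     >>> s.dtype
#     period[D]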
diff --git a/pandas/tests/reshape/test_concat.py b/pandas/tests/reshape/test_concat.py index d39c9fafe5749..e65a2e9f9d4fa 100644 --- a/pandas/tests/reshape/test_concat.py +++ b/pandas/tests/reshape/test_concat.py @@ -93,7 +93,7 @@ def _check_expected_dtype(self, obj, label): assert obj.dtype == label elif isinstance(obj, pd.Series): if label.startswith('period'): - assert obj.dtype == 'object' + assert obj.dtype == 'Period[M]' else: assert obj.dtype == label else: @@ -1995,12 +1995,11 @@ def test_concat_NaT_dataframes(self, tz): def test_concat_period_series(self): x = Series(pd.PeriodIndex(['2015-11-01', '2015-12-01'], freq='D')) y = Series(pd.PeriodIndex(['2015-10-01', '2016-01-01'], freq='D')) - expected = Series([x[0], x[1], y[0], y[1]], dtype='object') + expected = Series([x[0], x[1], y[0], y[1]], dtype='Period[D]') result = concat([x, y], ignore_index=True) tm.assert_series_equal(result, expected) - assert result.dtype == 'object' - # different freq + def test_concat_period_multiple_freq_series(self): x = Series(pd.PeriodIndex(['2015-11-01', '2015-12-01'], freq='D')) y = Series(pd.PeriodIndex(['2015-10-01', '2016-01-01'], freq='M')) expected = Series([x[0], x[1], y[0], y[1]], dtype='object') @@ -2008,6 +2007,7 @@ def test_concat_period_series(self): tm.assert_series_equal(result, expected) assert result.dtype == 'object' + def test_concat_period_other_series(self): x = Series(pd.PeriodIndex(['2015-11-01', '2015-12-01'], freq='D')) y = Series(pd.PeriodIndex(['2015-11-01', '2015-12-01'], freq='M')) expected = Series([x[0], x[1], y[0], y[1]], dtype='object') diff --git a/pandas/tests/scalar/test_nat.py b/pandas/tests/scalar/test_nat.py index bc8582d9b7d29..b978ccf4a2f6a 100644 --- a/pandas/tests/scalar/test_nat.py +++ b/pandas/tests/scalar/test_nat.py @@ -5,8 +5,9 @@ import numpy as np from pandas import (NaT, Index, Timestamp, Timedelta, Period, - DatetimeIndex, PeriodIndex, + DatetimeIndex, TimedeltaIndex, Series, isna) +from pandas.core.arrays import PeriodArray from pandas.util import testing as tm from pandas._libs.tslib import iNaT @@ -15,7 +16,7 @@ @pytest.mark.parametrize('nat, idx', [(Timestamp('NaT'), DatetimeIndex), (Timedelta('NaT'), TimedeltaIndex), - (Period('NaT', freq='M'), PeriodIndex)]) + (Period('NaT', freq='M'), PeriodArray)]) def test_nat_fields(nat, idx): for field in idx._field_ops: diff --git a/pandas/tests/series/test_api.py b/pandas/tests/series/test_api.py index 3b82242626c20..3e68d4fc03f1f 100644 --- a/pandas/tests/series/test_api.py +++ b/pandas/tests/series/test_api.py @@ -14,7 +14,8 @@ from pandas.compat import range, lzip, isidentifier, string_types from pandas import (compat, Categorical, period_range, timedelta_range, - DatetimeIndex, PeriodIndex, TimedeltaIndex) + DatetimeIndex, TimedeltaIndex) +from pandas.core.arrays import PeriodArray import pandas.io.formats.printing as printing from pandas.util.testing import (assert_series_equal, ensure_clean) @@ -698,7 +699,7 @@ def test_dt_accessor_api_for_categorical(self): test_data = [ ("Datetime", get_ops(DatetimeIndex), s_dr, c_dr), - ("Period", get_ops(PeriodIndex), s_pr, c_pr), + ("Period", get_ops(PeriodArray), s_pr, c_pr), ("Timedelta", get_ops(TimedeltaIndex), s_tdr, c_tdr)] assert isinstance(c_dr.dt, Properties) diff --git a/pandas/tests/series/test_apply.py b/pandas/tests/series/test_apply.py index 20215279cf031..509cd8d0f3241 100644 --- a/pandas/tests/series/test_apply.py +++ b/pandas/tests/series/test_apply.py @@ -119,11 +119,11 @@ def test_apply_box(self): exp = pd.Series(['Timedelta_1', 
'Timedelta_2'])
         tm.assert_series_equal(res, exp)

-        # period (object dtype, not boxed)
+        # period
         vals = [pd.Period('2011-01-01', freq='M'),
                 pd.Period('2011-01-02', freq='M')]
         s = pd.Series(vals)
-        assert s.dtype == 'object'
+        assert s.dtype == 'Period[M]'
         res = s.apply(lambda x: '{0}_{1}'.format(x.__class__.__name__,
                                                  x.freqstr))
         exp = pd.Series(['Period_M', 'Period_M'])
@@ -599,11 +599,11 @@ def test_map_box(self):
         exp = pd.Series(['Timedelta_1', 'Timedelta_2'])
         tm.assert_series_equal(res, exp)

-        # period (object dtype, not boxed)
+        # period
         vals = [pd.Period('2011-01-01', freq='M'),
                 pd.Period('2011-01-02', freq='M')]
         s = pd.Series(vals)
-        assert s.dtype == 'object'
+        assert s.dtype == 'Period[M]'
         res = s.map(lambda x: '{0}_{1}'.format(x.__class__.__name__,
                                                x.freqstr))
         exp = pd.Series(['Period_M', 'Period_M'])
diff --git a/pandas/tests/series/test_constructors.py b/pandas/tests/series/test_constructors.py
index 57a3f54fadbcc..83990bddcee5d 100644
--- a/pandas/tests/series/test_constructors.py
+++ b/pandas/tests/series/test_constructors.py
@@ -18,7 +18,7 @@
 from pandas import (Index, Series, isna, date_range, Timestamp, NaT,
                     period_range, timedelta_range, MultiIndex,
                     IntervalIndex, Categorical, DataFrame)
-
+from pandas.core.arrays import period_array
 from pandas._libs import lib
 from pandas._libs.tslib import iNaT
@@ -856,17 +856,33 @@ def test_construction_consistency(self):
         result = Series(s.values, dtype=s.dtype)
         tm.assert_series_equal(result, s)

+    def test_constructor_infer_period(self):
+        data = [pd.Period('2000', 'D'), pd.Period('2001', 'D'), None]
+        result = pd.Series(data)
+        expected = pd.Series(period_array(data))
+        tm.assert_series_equal(result, expected)
+        assert result.dtype == 'Period[D]'
+
+        data = np.asarray(data, dtype=object)
+        result = pd.Series(data)
+        tm.assert_series_equal(result, expected)
+        assert result.dtype == 'Period[D]'
+
+    def test_constructor_period_incompatible_frequency(self):
+        data = [pd.Period('2000', 'D'), pd.Period('2001', 'A')]
+        result = pd.Series(data)
+        assert result.dtype == object
+        assert result.tolist() == data
+
     def test_constructor_periodindex(self):
         # GH7932
         # converting a PeriodIndex when put in a Series

         pi = period_range('20130101', periods=5, freq='D')
         s = Series(pi)
+        assert s.dtype == 'Period[D]'
         expected = Series(pi.astype(object))
         assert_series_equal(s, expected)
-        assert s.dtype == 'object'

     def test_constructor_dict(self):
         d = {'a': 0., 'b': 1., 'c': 2.}
         result = Series(d, index=['b', 'c', 'd', 'a'])
@@ -1141,7 +1157,12 @@ def test_convert_non_ns(self):

     def test_constructor_cant_cast_datetimelike(self, index):

         # floats are not ok
-        msg = "Cannot cast {} to ".format(type(index).__name__)
+        msg = "Cannot cast {}.*? 
to ".format( + # strip Index to convert PeriodIndex -> Period + # We don't care whether the error message says + # PeriodIndex or PeriodArray + type(index).__name__.rstrip("Index") + ) with tm.assert_raises_regex(TypeError, msg): Series(index, dtype=float) diff --git a/pandas/tests/series/test_datetime_values.py b/pandas/tests/series/test_datetime_values.py index e06d3a67db662..7f8bd375cb1a4 100644 --- a/pandas/tests/series/test_datetime_values.py +++ b/pandas/tests/series/test_datetime_values.py @@ -18,6 +18,7 @@ PeriodIndex, DatetimeIndex, TimedeltaIndex, compat) import pandas.core.common as com +from pandas.core.arrays import PeriodArray from pandas._libs.tslibs.timezones import maybe_get_tz from pandas.util.testing import assert_series_equal @@ -31,7 +32,7 @@ def test_dt_namespace_accessor(self): # GH 7207, 11128 # test .dt namespace accessor - ok_for_period = PeriodIndex._datetimelike_ops + ok_for_period = PeriodArray._datetimelike_ops ok_for_period_methods = ['strftime', 'to_timestamp', 'asfreq'] ok_for_dt = DatetimeIndex._datetimelike_ops ok_for_dt_methods = ['to_period', 'to_pydatetime', 'tz_localize', diff --git a/pandas/tests/series/test_operators.py b/pandas/tests/series/test_operators.py index 55e3dfde3ceb7..32a687be77b95 100644 --- a/pandas/tests/series/test_operators.py +++ b/pandas/tests/series/test_operators.py @@ -553,8 +553,11 @@ def test_unequal_categorical_comparison_raises_type_error(self): ([pd.Timedelta('1 days'), NaT, pd.Timedelta('3 days')], [NaT, NaT, pd.Timedelta('3 days')]), - ([pd.Period('2011-01', freq='M'), NaT, pd.Period('2011-03', freq='M')], - [NaT, NaT, pd.Period('2011-03', freq='M')])]) + ([pd.Period('2011-01', freq='M'), NaT, + pd.Period('2011-03', freq='M')], + [NaT, NaT, pd.Period('2011-03', freq='M')]), + + ]) @pytest.mark.parametrize('reverse', [True, False]) @pytest.mark.parametrize('box', [Series, Index]) @pytest.mark.parametrize('dtype', [None, object]) diff --git a/pandas/tests/series/test_period.py b/pandas/tests/series/test_period.py index 24c2f30bef569..7a095b6dc6663 100644 --- a/pandas/tests/series/test_period.py +++ b/pandas/tests/series/test_period.py @@ -4,6 +4,7 @@ import pandas as pd import pandas.util.testing as tm import pandas.core.indexes.period as period +from pandas.core.arrays import PeriodArray from pandas import Series, period_range, DataFrame, Period @@ -18,11 +19,11 @@ def setup_method(self, method): def test_auto_conversion(self): series = Series(list(period_range('2000-01-01', periods=10, freq='D'))) - assert series.dtype == 'object' + assert series.dtype == 'Period[D]' series = pd.Series([pd.Period('2011-01-01', freq='D'), pd.Period('2011-02-01', freq='D')]) - assert series.dtype == 'object' + assert series.dtype == 'Period[D]' def test_getitem(self): assert self.series[1] == pd.Period('2000-01-02', freq='D') @@ -30,9 +31,9 @@ def test_getitem(self): result = self.series[[2, 4]] exp = pd.Series([pd.Period('2000-01-03', freq='D'), pd.Period('2000-01-05', freq='D')], - index=[2, 4]) + index=[2, 4], dtype='Period[D]') tm.assert_series_equal(result, exp) - assert result.dtype == 'object' + assert result.dtype == 'Period[D]' def test_isna(self): # GH 13737 @@ -50,12 +51,7 @@ def test_fillna(self): exp = Series([pd.Period('2011-01', freq='M'), pd.Period('2012-01', freq='M')]) tm.assert_series_equal(res, exp) - assert res.dtype == 'object' - - res = s.fillna('XXX') - exp = Series([pd.Period('2011-01', freq='M'), 'XXX']) - tm.assert_series_equal(res, exp) - assert res.dtype == 'object' + assert res.dtype == 'Period[M]' def 
test_dropna(self): # GH 13737 @@ -91,19 +87,20 @@ def test_NaT_cast(self): expected = Series([pd.NaT]) tm.assert_series_equal(result, expected) - def test_set_none_nan(self): - # currently Period is stored as object dtype, not as NaT + def test_set_none(self): self.series[3] = None - assert self.series[3] is None + assert self.series[3] is pd.NaT self.series[3:5] = None - assert self.series[4] is None + assert self.series[4] is pd.NaT + def test_set_nan(self): + # Do we want to allow this? self.series[5] = np.nan - assert np.isnan(self.series[5]) + assert self.series[5] is pd.NaT self.series[5:7] = np.nan - assert np.isnan(self.series[6]) + assert self.series[6] is pd.NaT def test_intercept_astype_object(self): expected = self.series.astype('object') @@ -184,6 +181,7 @@ def test_end_time_timevalues(self, input_vals): # GH 17157 # Check that the time part of the Period is adjusted by end_time # when using the dt accessor on a Series + input_vals = PeriodArray._from_sequence(np.asarray(input_vals)) s = Series(input_vals) result = s.dt.end_time diff --git a/pandas/tests/test_base.py b/pandas/tests/test_base.py index bbc5bd96bad55..fe2956adc35af 100644 --- a/pandas/tests/test_base.py +++ b/pandas/tests/test_base.py @@ -1179,11 +1179,11 @@ def test_iter_box(self): assert isinstance(res, Timedelta) assert res == exp - # period (object dtype, not boxed) + # period vals = [pd.Period('2011-01-01', freq='M'), pd.Period('2011-01-02', freq='M')] s = Series(vals) - assert s.dtype == 'object' + assert s.dtype == 'Period[M]' for res, exp in zip(s, vals): assert isinstance(res, pd.Period) assert res.freq == 'M' @@ -1198,7 +1198,8 @@ def test_iter_box(self): (pd.DatetimeIndex(['2017', '2018'], tz="US/Central"), pd.DatetimeIndex, 'datetime64[ns, US/Central]'), (pd.TimedeltaIndex([10**10]), np.ndarray, 'm8[ns]'), - (pd.PeriodIndex([2018, 2019], freq='A'), np.ndarray, 'object'), + (pd.PeriodIndex([2018, 2019], freq='A'), pd.core.arrays.PeriodArray, + pd.core.dtypes.dtypes.PeriodDtype("A-DEC")), (pd.IntervalIndex.from_breaks([0, 1, 2]), pd.core.arrays.IntervalArray, 'interval'), ]) @@ -1214,6 +1215,8 @@ def test_values_consistent(array, expected_type, dtype): tm.assert_index_equal(l_values, r_values) elif pd.api.types.is_categorical(l_values): tm.assert_categorical_equal(l_values, r_values) + elif pd.api.types.is_period_dtype(l_values): + tm.assert_period_array_equal(l_values, r_values) elif pd.api.types.is_interval_dtype(l_values): tm.assert_interval_array_equal(l_values, r_values) else: @@ -1232,12 +1235,8 @@ def test_values_consistent(array, expected_type, dtype): (pd.DatetimeIndex(['2017-01-01T00:00:00'], tz="US/Eastern"), np.array(['2017-01-01T05:00:00'], dtype='M8[ns]')), (pd.TimedeltaIndex([10**10]), np.array([10**10], dtype='m8[ns]')), - pytest.param( - pd.PeriodIndex(['2017', '2018'], freq='D'), - np.array([17167, 17532]), - marks=pytest.mark.xfail(reason="PeriodArray Not implemented", - strict=True) - ), + (pd.PeriodIndex(['2017', '2018'], freq='D'), + np.array([17167, 17532], dtype=np.int64)), ]) def test_ndarray_values(array, expected): l_values = pd.Series(array)._ndarray_values diff --git a/pandas/util/testing.py b/pandas/util/testing.py index a93487a21696d..44163479dfd27 100644 --- a/pandas/util/testing.py +++ b/pandas/util/testing.py @@ -19,7 +19,11 @@ import numpy as np import pandas as pd -from pandas.core.arrays import ExtensionArray, IntervalArray +from pandas.core.arrays import ( + ExtensionArray, + IntervalArray, + PeriodArray, +) from pandas.core.dtypes.missing import array_equivalent 
from pandas.core.dtypes.common import ( is_datetimelike_v_numeric, @@ -1050,6 +1054,14 @@ def assert_interval_array_equal(left, right, exact='equiv', assert_attr_equal('closed', left, right, obj=obj) +def assert_period_array_equal(left, right, obj='PeriodArray'): + _check_isinstance(left, right, PeriodArray) + + assert_numpy_array_equal(left._data, right._data, + obj='{obj}.values'.format(obj=obj)) + assert_attr_equal('freq', left, right, obj=obj) + + def raise_assert_detail(obj, message, left, right, diff=None): __tracebackhide__ = True @@ -1543,6 +1555,10 @@ def assert_equal(left, right, **kwargs): assert_series_equal(left, right, **kwargs) elif isinstance(left, pd.DataFrame): assert_frame_equal(left, right, **kwargs) + elif isinstance(left, IntervalArray): + assert_interval_array_equal(left, right, **kwargs) + elif isinstance(left, PeriodArray): + assert_period_array_equal(left, right, **kwargs) elif isinstance(left, ExtensionArray): assert_extension_array_equal(left, right, **kwargs) elif isinstance(left, np.ndarray): From 8da1b36d97192801ac984ffec4dc9b2d1218fef2 Mon Sep 17 00:00:00 2001 From: Krishna Date: Fri, 26 Oct 2018 00:37:36 +0100 Subject: [PATCH 08/23] DOC: Added a Multi Index example for the Series.sum method (#23279) --- pandas/core/generic.py | 34 ++++++++++++++++++++++++++++++++++ 1 file changed, 34 insertions(+) diff --git a/pandas/core/generic.py b/pandas/core/generic.py index ceed4c3083471..a80b6df703df0 100644 --- a/pandas/core/generic.py +++ b/pandas/core/generic.py @@ -10185,6 +10185,40 @@ def _doc_parms(cls): _sum_examples = """\ Examples -------- +``MultiIndex`` series example of monthly rainfall + +>>> index = pd.MultiIndex.from_product( +... [['London', 'New York'], ['Jun', 'Jul', 'Aug']], +... names=['city', 'month']) +>>> s = pd.Series([47, 35, 54, 112, 117, 113], index=index) +>>> s +city month +London Jun 47 + Jul 35 + Aug 54 +New York Jun 112 + Jul 117 + Aug 113 +dtype: int64 + +>>> s.sum() +478 + +Sum using level names, as well as indices + +>>> s.sum(level='city') +city +London 136 +New York 342 +dtype: int64 + +>>> s.sum(level=1) +month +Jun 159 +Jul 152 +Aug 167 +dtype: int64 + By default, the sum of an empty or all-NA Series is ``0``. 
>>> pd.Series([]).sum() # min_count=0 is the default From aed5689a90209bf8748dde207a7110c1c31036b7 Mon Sep 17 00:00:00 2001 From: alimcmaster1 Date: Fri, 26 Oct 2018 00:59:29 +0100 Subject: [PATCH 09/23] isort imports-io (#23332) Signed-off-by: alimcmaster1 --- pandas/io/api.py | 19 ++++++------ pandas/io/clipboards.py | 5 ++- pandas/io/common.py | 20 ++++++------ pandas/io/date_converters.py | 3 +- pandas/io/excel.py | 42 ++++++++++++------------- pandas/io/feather_format.py | 3 +- pandas/io/html.py | 18 +++++------ pandas/io/parquet.py | 7 +++-- pandas/io/parsers.py | 59 ++++++++++++++++++------------------ pandas/io/pickle.py | 5 +-- pandas/io/s3.py | 1 + pandas/io/sas/sas_xport.py | 9 +++--- pandas/io/sql.py | 26 ++++++++-------- pandas/io/stata.py | 20 ++++++------ setup.cfg | 15 --------- 15 files changed, 121 insertions(+), 131 deletions(-) diff --git a/pandas/io/api.py b/pandas/io/api.py index f542a8176dce7..496a00126de87 100644 --- a/pandas/io/api.py +++ b/pandas/io/api.py @@ -4,20 +4,21 @@ # flake8: noqa -from pandas.io.parsers import read_csv, read_table, read_fwf from pandas.io.clipboards import read_clipboard from pandas.io.excel import ExcelFile, ExcelWriter, read_excel -from pandas.io.pytables import HDFStore, get_store, read_hdf -from pandas.io.json import read_json -from pandas.io.html import read_html -from pandas.io.sql import read_sql, read_sql_table, read_sql_query -from pandas.io.sas import read_sas from pandas.io.feather_format import read_feather +from pandas.io.gbq import read_gbq +from pandas.io.html import read_html +from pandas.io.json import read_json +from pandas.io.packers import read_msgpack, to_msgpack from pandas.io.parquet import read_parquet -from pandas.io.stata import read_stata +from pandas.io.parsers import read_csv, read_fwf, read_table from pandas.io.pickle import read_pickle, to_pickle -from pandas.io.packers import read_msgpack, to_msgpack -from pandas.io.gbq import read_gbq +from pandas.io.pytables import HDFStore, get_store, read_hdf +from pandas.io.sas import read_sas +from pandas.io.sql import read_sql, read_sql_query, read_sql_table +from pandas.io.stata import read_stata + # deprecation, xref #13790 def Term(*args, **kwargs): diff --git a/pandas/io/clipboards.py b/pandas/io/clipboards.py index 70c978a3b62ed..287a03c2e5728 100644 --- a/pandas/io/clipboards.py +++ b/pandas/io/clipboards.py @@ -1,10 +1,9 @@ """ io on the clipboard """ import warnings -from pandas.compat import StringIO, PY2, PY3 - -from pandas.core.dtypes.generic import ABCDataFrame from pandas import compat, get_option, option_context +from pandas.compat import PY2, PY3, StringIO +from pandas.core.dtypes.generic import ABCDataFrame def read_clipboard(sep=r'\s+', **kwargs): # pragma: no cover diff --git a/pandas/io/common.py b/pandas/io/common.py index 2056c25ddc5f4..40247c4aebd1e 100644 --- a/pandas/io/common.py +++ b/pandas/io/common.py @@ -1,21 +1,21 @@ """Common IO api utilities""" -import os -import csv import codecs +import csv import mmap -from contextlib import contextmanager, closing +import os import zipfile +from contextlib import closing, contextmanager -from pandas.compat import StringIO, BytesIO, string_types, text_type -from pandas import compat -from pandas.io.formats.printing import pprint_thing import pandas.core.common as com -from pandas.core.dtypes.common import is_number, is_file_like - +from pandas import compat +from pandas.compat import BytesIO, StringIO, string_types, text_type +from pandas.core.dtypes.common import is_file_like, is_number # compat 
-from pandas.errors import (ParserError, DtypeWarning, # noqa - EmptyDataError, ParserWarning) +from pandas.errors import ( # noqa + DtypeWarning, EmptyDataError, ParserError, ParserWarning +) +from pandas.io.formats.printing import pprint_thing # gh-12665: Alias for now and remove later. CParserError = ParserError diff --git a/pandas/io/date_converters.py b/pandas/io/date_converters.py index 377373f8a0135..1a22ee7240d59 100644 --- a/pandas/io/date_converters.py +++ b/pandas/io/date_converters.py @@ -1,7 +1,8 @@ """This module is designed for community supported date conversion functions""" -from pandas.compat import range, map import numpy as np + from pandas._libs.tslibs import parsing +from pandas.compat import map, range def parse_date_time(date_col, time_col): diff --git a/pandas/io/excel.py b/pandas/io/excel.py index c1cbccb7cbf1c..c6a04b9bdee20 100644 --- a/pandas/io/excel.py +++ b/pandas/io/excel.py @@ -2,39 +2,37 @@ Module parse to/from Excel """ -# --------------------------------------------------------------------- -# ExcelFile class -from datetime import datetime, date, time, MINYEAR, timedelta - -import os import abc +import os import warnings -from textwrap import fill -from io import UnsupportedOperation +# --------------------------------------------------------------------- +# ExcelFile class +from datetime import MINYEAR, date, datetime, time, timedelta from distutils.version import LooseVersion +from io import UnsupportedOperation +from textwrap import fill import numpy as np import pandas._libs.json as json -from pandas.util._decorators import Appender, deprecate_kwarg -from pandas.errors import EmptyDataError - import pandas.compat as compat -from pandas.compat import (map, zip, reduce, range, lrange, u, add_metaclass, - string_types, OrderedDict) - -from pandas.core.dtypes.common import ( - is_integer, is_float, - is_bool, is_list_like) - +from pandas.compat import ( + OrderedDict, add_metaclass, lrange, map, range, reduce, string_types, u, + zip +) from pandas.core import config +from pandas.core.dtypes.common import ( + is_bool, is_float, is_integer, is_list_like +) from pandas.core.frame import DataFrame - -from pandas.io.parsers import TextParser -from pandas.io.common import (_is_url, _urlopen, _validate_header_arg, - get_filepath_or_buffer, _NA_VALUES, - _stringify_path) +from pandas.errors import EmptyDataError +from pandas.io.common import ( + _NA_VALUES, _is_url, _stringify_path, _urlopen, _validate_header_arg, + get_filepath_or_buffer +) from pandas.io.formats.printing import pprint_thing +from pandas.io.parsers import TextParser +from pandas.util._decorators import Appender, deprecate_kwarg __all__ = ["read_excel", "ExcelWriter", "ExcelFile"] diff --git a/pandas/io/feather_format.py b/pandas/io/feather_format.py index 1bc6526214a91..436c16839ffc2 100644 --- a/pandas/io/feather_format.py +++ b/pandas/io/feather_format.py @@ -1,7 +1,8 @@ """ feather-format compat """ from distutils.version import LooseVersion -from pandas import DataFrame, RangeIndex, Int64Index + +from pandas import DataFrame, Int64Index, RangeIndex from pandas.compat import range from pandas.io.common import _stringify_path diff --git a/pandas/io/html.py b/pandas/io/html.py index 04534ff591a2c..a1d3f4589ba35 100644 --- a/pandas/io/html.py +++ b/pandas/io/html.py @@ -3,22 +3,22 @@ """ +import numbers import os import re -import numbers - from distutils.version import LooseVersion +import pandas.core.common as com +from pandas import Series, compat +from pandas.compat import ( + binary_type, 
iteritems, lmap, lrange, raise_with_traceback, string_types, + u +) from pandas.core.dtypes.common import is_list_like from pandas.errors import EmptyDataError -from pandas.io.common import _is_url, urlopen, _validate_header_arg -from pandas.io.parsers import TextParser -from pandas import compat -from pandas.compat import (lrange, lmap, u, string_types, iteritems, - raise_with_traceback, binary_type) -from pandas import Series -import pandas.core.common as com +from pandas.io.common import _is_url, _validate_header_arg, urlopen from pandas.io.formats.printing import pprint_thing +from pandas.io.parsers import TextParser _IMPORTS = False _HAS_BS4 = False diff --git a/pandas/io/parquet.py b/pandas/io/parquet.py index 6ab56c68a510a..aef1d84a19bc7 100644 --- a/pandas/io/parquet.py +++ b/pandas/io/parquet.py @@ -1,10 +1,11 @@ """ parquet compat """ -from warnings import catch_warnings from distutils.version import LooseVersion -from pandas import DataFrame, RangeIndex, Int64Index, get_option -from pandas.compat import string_types +from warnings import catch_warnings + import pandas.core.common as com +from pandas import DataFrame, Int64Index, RangeIndex, get_option +from pandas.compat import string_types from pandas.io.common import get_filepath_or_buffer, is_s3_url diff --git a/pandas/io/parsers.py b/pandas/io/parsers.py index eeba30ed8a44f..8dd50fceb4efb 100755 --- a/pandas/io/parsers.py +++ b/pandas/io/parsers.py @@ -2,50 +2,51 @@ Module contains tools for processing files into DataFrames or other objects """ from __future__ import print_function -from collections import defaultdict -import re + import csv +import datetime +import re import sys import warnings -import datetime +from collections import defaultdict from textwrap import fill import numpy as np +import pandas._libs.lib as lib +import pandas._libs.ops as libops +import pandas._libs.parsers as parsers +import pandas.core.common as com from pandas import compat -from pandas.compat import (range, lrange, PY3, StringIO, lzip, - zip, string_types, map, u) +from pandas._libs.tslibs import parsing +from pandas.compat import ( + PY3, StringIO, lrange, lzip, map, range, string_types, u, zip +) +from pandas.core import algorithms +from pandas.core.arrays import Categorical +from pandas.core.dtypes.cast import astype_nansafe from pandas.core.dtypes.common import ( - is_integer, ensure_object, - is_list_like, is_integer_dtype, - is_float, is_dtype_equal, - is_object_dtype, is_string_dtype, - is_scalar, is_categorical_dtype) + ensure_object, is_categorical_dtype, is_dtype_equal, is_float, is_integer, + is_integer_dtype, is_list_like, is_object_dtype, is_scalar, + is_string_dtype +) from pandas.core.dtypes.dtypes import CategoricalDtype from pandas.core.dtypes.missing import isna -from pandas.core.dtypes.cast import astype_nansafe -from pandas.core.index import (Index, MultiIndex, RangeIndex, - ensure_index_from_sequences) -from pandas.core.series import Series from pandas.core.frame import DataFrame -from pandas.core.arrays import Categorical -from pandas.core import algorithms -import pandas.core.common as com -from pandas.io.date_converters import generic_parser -from pandas.errors import ParserWarning, ParserError, EmptyDataError -from pandas.io.common import (get_filepath_or_buffer, is_file_like, - _validate_header_arg, _get_handle, - UnicodeReader, UTF8Recoder, _NA_VALUES, - BaseIterator, _infer_compression) +from pandas.core.index import ( + Index, MultiIndex, RangeIndex, ensure_index_from_sequences +) +from pandas.core.series import 
Series from pandas.core.tools import datetimes as tools - +from pandas.errors import EmptyDataError, ParserError, ParserWarning +from pandas.io.common import ( + _NA_VALUES, BaseIterator, UnicodeReader, UTF8Recoder, _get_handle, + _infer_compression, _validate_header_arg, get_filepath_or_buffer, + is_file_like +) +from pandas.io.date_converters import generic_parser from pandas.util._decorators import Appender -import pandas._libs.lib as lib -import pandas._libs.parsers as parsers -import pandas._libs.ops as libops -from pandas._libs.tslibs import parsing - # BOM character (byte order mark) # This exists at the beginning of a file to indicate endianness # of a file (stream). Unfortunately, this marker screws up parsing, diff --git a/pandas/io/pickle.py b/pandas/io/pickle.py index d52a571da0d61..4e71462f4e331 100644 --- a/pandas/io/pickle.py +++ b/pandas/io/pickle.py @@ -3,8 +3,9 @@ import numpy as np from numpy.lib.format import read_array, write_array -from pandas.compat import BytesIO, cPickle as pkl, pickle_compat as pc, PY3 -from pandas.core.dtypes.common import is_datetime64_dtype, _NS_DTYPE + +from pandas.compat import PY3, BytesIO, cPickle as pkl, pickle_compat as pc +from pandas.core.dtypes.common import _NS_DTYPE, is_datetime64_dtype from pandas.io.common import _get_handle, _stringify_path diff --git a/pandas/io/s3.py b/pandas/io/s3.py index 7d1360934fd53..4998e4c0400ac 100644 --- a/pandas/io/s3.py +++ b/pandas/io/s3.py @@ -1,5 +1,6 @@ """ s3 support for remote file interactivity """ from pandas import compat + try: import s3fs from botocore.exceptions import NoCredentialsError diff --git a/pandas/io/sas/sas_xport.py b/pandas/io/sas/sas_xport.py index 385396909a07b..c326580487b09 100644 --- a/pandas/io/sas/sas_xport.py +++ b/pandas/io/sas/sas_xport.py @@ -8,17 +8,16 @@ https://support.sas.com/techsup/technote/ts140.pdf """ -from datetime import datetime import struct import warnings +from datetime import datetime import numpy as np -from pandas.util._decorators import Appender -from pandas import compat - -from pandas.io.common import get_filepath_or_buffer, BaseIterator import pandas as pd +from pandas import compat +from pandas.io.common import BaseIterator, get_filepath_or_buffer +from pandas.util._decorators import Appender _correct_line1 = ("HEADER RECORD*******LIBRARY HEADER RECORD!!!!!!!" "000000000000000000000000000000 ") diff --git a/pandas/io/sql.py b/pandas/io/sql.py index 882fa0092b2cf..3876792d6226f 100644 --- a/pandas/io/sql.py +++ b/pandas/io/sql.py @@ -4,28 +4,28 @@ retrieval and to reduce dependency on DB-specific API. 
""" -from __future__ import print_function, division -from datetime import datetime, date, time +from __future__ import division, print_function -import warnings import re +import warnings +from contextlib import contextmanager +from datetime import date, datetime, time + import numpy as np import pandas._libs.lib as lib -from pandas.core.dtypes.missing import isna -from pandas.core.dtypes.dtypes import DatetimeTZDtype -from pandas.core.dtypes.common import ( - is_list_like, is_dict_like, - is_datetime64tz_dtype) - -from pandas.compat import (map, zip, raise_with_traceback, - string_types, text_type) +from pandas.compat import ( + map, raise_with_traceback, string_types, text_type, zip +) from pandas.core.api import DataFrame, Series from pandas.core.base import PandasObject +from pandas.core.dtypes.common import ( + is_datetime64tz_dtype, is_dict_like, is_list_like +) +from pandas.core.dtypes.dtypes import DatetimeTZDtype +from pandas.core.dtypes.missing import isna from pandas.core.tools.datetimes import to_datetime -from contextlib import contextmanager - class SQLAlchemyRequired(ImportError): pass diff --git a/pandas/io/stata.py b/pandas/io/stata.py index 68b2182c2ff07..00d1a92587930 100644 --- a/pandas/io/stata.py +++ b/pandas/io/stata.py @@ -13,27 +13,29 @@ import datetime import struct import sys -from collections import OrderedDict import warnings +from collections import OrderedDict import numpy as np from dateutil.relativedelta import relativedelta +from pandas import DatetimeIndex, compat, isna, to_datetime, to_timedelta from pandas._libs.lib import infer_dtype from pandas._libs.tslibs import NaT, Timestamp from pandas._libs.writers import max_len_string_array - -from pandas import compat, to_timedelta, to_datetime, isna, DatetimeIndex -from pandas.compat import (lrange, lmap, lzip, text_type, string_types, range, - zip, BytesIO) +from pandas.compat import ( + BytesIO, lmap, lrange, lzip, range, string_types, text_type, zip +) from pandas.core.arrays import Categorical from pandas.core.base import StringMixin -from pandas.core.dtypes.common import (is_categorical_dtype, ensure_object, - is_datetime64_dtype) +from pandas.core.dtypes.common import ( + ensure_object, is_categorical_dtype, is_datetime64_dtype +) from pandas.core.frame import DataFrame from pandas.core.series import Series -from pandas.io.common import (get_filepath_or_buffer, BaseIterator, - _stringify_path) +from pandas.io.common import ( + BaseIterator, _stringify_path, get_filepath_or_buffer +) from pandas.util._decorators import Appender, deprecate_kwarg _version_error = ("Version of given Stata file is not 104, 105, 108, " diff --git a/setup.cfg b/setup.cfg index ee39844996025..de3bd356e8f55 100644 --- a/setup.cfg +++ b/setup.cfg @@ -96,21 +96,6 @@ skip= pandas/util/_print_versions.py, pandas/util/_decorators.py, pandas/util/_test_decorators.py, - pandas/io/s3.py, - pandas/io/parquet.py, - pandas/io/feather_format.py, - pandas/io/api.py, - pandas/io/sql.py, - pandas/io/clipboards.py, - pandas/io/excel.py, - pandas/io/date_converters.py, - pandas/io/testing.py, - pandas/io/common.py, - pandas/io/parsers.py, - pandas/io/html.py, - pandas/io/pickle.py, - pandas/io/stata.py, - pandas/io/sas/sas_xport.py, pandas/io/sas/sas7bdat.py, pandas/io/formats/console.py, pandas/io/formats/excel.py, From dae17ab9019063de50d7606da792c030eb937e77 Mon Sep 17 00:00:00 2001 From: Krishna Date: Fri, 26 Oct 2018 01:14:01 +0100 Subject: [PATCH 10/23] Switched references of App veyor to azure pipelines in the contributing CI section 
(#23311)

---
 doc/source/contributing.rst | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/doc/source/contributing.rst b/doc/source/contributing.rst
index f898ef54e4101..67b8d287d5d1a 100644
--- a/doc/source/contributing.rst
+++ b/doc/source/contributing.rst
@@ -657,12 +657,12 @@ Testing With Continuous Integration
 -----------------------------------

 The *pandas* test suite will run automatically on `Travis-CI `__,
-`Appveyor `__, and `Circle CI `__ continuous integration
-services, once your pull request is submitted.
+`Azure Pipelines `__,
+and `Circle CI `__ continuous integration services, once your pull request is submitted.
 However, if you wish to run the test suite on a branch prior to submitting the pull request,
 then the continuous integration services need to be hooked to your GitHub repository. Instructions are here
 for `Travis-CI `__,
-`Appveyor `__ , and `CircleCI `__.
+`Azure Pipelines `__, and `CircleCI `__.

 A pull-request will be considered for merging when you have an all 'green' build. If any tests are failing,
 then you will get a red 'X', where you can click through to see the individual failed tests.
 This is an example of a green build.

 .. note::

-   Each time you push to *your* fork, a *new* run of the tests will be triggered on the CI. Appveyor will auto-cancel
-   any non-currently-running tests for that same pull-request. You can enable the auto-cancel feature for
+   Each time you push to *your* fork, a *new* run of the tests will be triggered on the CI.
+   You can enable the auto-cancel feature, which cancels any queued, not-yet-running test runs for that same pull request, for
    `Travis-CI here `__ and for
    `CircleCI here `__.

From d3a7df1ff3e1f1744294a3ad9391ccd42f42fee0 Mon Sep 17 00:00:00 2001
From: Tim Swast
Date: Thu, 25 Oct 2018 17:18:56 -0700
Subject: [PATCH 11/23] TST: re-enable gbq tests (#23303)

Fix clean-up steps to use the google.cloud.bigquery client library
directly, since some of the _Dataset and _Table logic was removed from
pandas-gbq.
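
The clean-up step now reduces to the following pattern (a minimal sketch,
not part of the diff itself, assuming the google-cloud-bigquery client API
of this era; the helper name ``recreate_dataset`` is invented for
illustration):

    from google.api_core import exceptions as api_exceptions
    from google.cloud import bigquery

    def recreate_dataset(client, dataset_id):
        # Drop any dataset (and its tables) left over from a previous
        # test run, then start from a clean slate.
        dataset_ref = client.dataset(dataset_id)
        try:
            client.delete_dataset(dataset_ref, delete_contents=True)
        except api_exceptions.NotFound:
            pass  # nothing to clean up
        client.create_dataset(bigquery.Dataset(dataset_ref))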
--- pandas/tests/io/test_gbq.py | 43 ++++++++++++++++++++----------------- 1 file changed, 23 insertions(+), 20 deletions(-) diff --git a/pandas/tests/io/test_gbq.py b/pandas/tests/io/test_gbq.py index bc604e066a3e8..345af7c8f056a 100644 --- a/pandas/tests/io/test_gbq.py +++ b/pandas/tests/io/test_gbq.py @@ -16,6 +16,9 @@ import pandas.util.testing as tm +api_exceptions = pytest.importorskip("google.api_core.exceptions") +bigquery = pytest.importorskip("google.cloud.bigquery") +service_account = pytest.importorskip("google.oauth2.service_account") pandas_gbq = pytest.importorskip('pandas_gbq') PROJECT_ID = None @@ -67,20 +70,16 @@ def _get_private_key_path(): return private_key_path -def clean_gbq_environment(private_key=None): - dataset = pandas_gbq.gbq._Dataset(_get_project_id(), - private_key=private_key) +def _get_client(): + project_id = _get_project_id() + credentials = None - for i in range(1, 10): - if DATASET_ID + str(i) in dataset.datasets(): - dataset_id = DATASET_ID + str(i) - table = pandas_gbq.gbq._Table(_get_project_id(), dataset_id, - private_key=private_key) - for j in range(1, 20): - if TABLE_ID + str(j) in dataset.tables(dataset_id): - table.delete(TABLE_ID + str(j)) + private_key_path = _get_private_key_path() + if private_key_path: + credentials = service_account.Credentials.from_service_account_file( + private_key_path) - dataset.delete(dataset_id) + return bigquery.Client(project=project_id, credentials=credentials) def make_mixed_dataframe_v2(test_size): @@ -109,7 +108,6 @@ def test_read_gbq_without_dialect_warns_future_change(monkeypatch): pd.read_gbq("SELECT 1") -@pytest.mark.xfail(reason="failing for pandas-gbq >= 0.7.0") @pytest.mark.single class TestToGBQIntegrationWithServiceAccountKeyPath(object): @@ -122,18 +120,22 @@ def setup_class(cls): _skip_if_no_project_id() _skip_if_no_private_key_path() - clean_gbq_environment(_get_private_key_path()) - pandas_gbq.gbq._Dataset(_get_project_id(), - private_key=_get_private_key_path() - ).create(DATASET_ID + "1") + cls.client = _get_client() + cls.dataset = cls.client.dataset(DATASET_ID + "1") + try: + # Clean-up previous test runs. + cls.client.delete_dataset(cls.dataset, delete_contents=True) + except api_exceptions.NotFound: + pass # It's OK if the dataset doesn't already exist. + + cls.client.create_dataset(bigquery.Dataset(cls.dataset)) @classmethod def teardown_class(cls): # - GLOBAL CLASS FIXTURES - # put here any instruction you want to execute only *ONCE* *AFTER* # executing all tests. 
- - clean_gbq_environment(_get_private_key_path()) + cls.client.delete_dataset(cls.dataset, delete_contents=True) def test_roundtrip(self): destination_table = DESTINATION_TABLE + "1" @@ -147,5 +149,6 @@ def test_roundtrip(self): result = pd.read_gbq("SELECT COUNT(*) AS num_rows FROM {0}" .format(destination_table), project_id=_get_project_id(), - private_key=_get_private_key_path()) + private_key=_get_private_key_path(), + dialect="standard") assert result['num_rows'][0] == test_size From 2ff7eec0ac0208537d8f20e5cfd84e2aada36c13 Mon Sep 17 00:00:00 2001 From: Tom Augspurger Date: Thu, 25 Oct 2018 19:21:23 -0500 Subject: [PATCH 12/23] BUG: Handle Datetimelike data in DataFrame.combine (#23317) Closes https://github.com/pandas-dev/pandas/issues/23079 --- doc/source/whatsnew/v0.24.0.txt | 1 + pandas/core/frame.py | 43 +++++++++++++---------- pandas/tests/frame/test_combine_concat.py | 18 ++++++++++ 3 files changed, 43 insertions(+), 19 deletions(-) diff --git a/doc/source/whatsnew/v0.24.0.txt b/doc/source/whatsnew/v0.24.0.txt index 47fef83d3015d..5fa391c3433ea 100644 --- a/doc/source/whatsnew/v0.24.0.txt +++ b/doc/source/whatsnew/v0.24.0.txt @@ -1012,6 +1012,7 @@ Datetimelike - Bug in :func:`to_datetime` with an :class:`Index` argument that would drop the ``name`` from the result (:issue:`21697`) - Bug in :class:`PeriodIndex` where adding or subtracting a :class:`timedelta` or :class:`Tick` object produced incorrect results (:issue:`22988`) - Bug in :func:`date_range` when decrementing a start date to a past end date by a negative frequency (:issue:`23270`) +- Bug in :func:`DataFrame.combine` with datetimelike values raising a TypeError (:issue:`23079`) Timedelta ^^^^^^^^^ diff --git a/pandas/core/frame.py b/pandas/core/frame.py index 6dd9174028f18..61721ce4c82e7 100644 --- a/pandas/core/frame.py +++ b/pandas/core/frame.py @@ -5141,22 +5141,14 @@ def combine(self, other, func, fill_value=None, overwrite=True): if not is_dtype_equal(other_dtype, new_dtype): otherSeries = otherSeries.astype(new_dtype) - # see if we need to be represented as i8 (datetimelike) - # try to keep us at this dtype - needs_i8_conversion_i = needs_i8_conversion(new_dtype) - if needs_i8_conversion_i: - arr = func(series, otherSeries, True) - else: - arr = func(series, otherSeries) - + arr = func(series, otherSeries) arr = maybe_downcast_to_dtype(arr, this_dtype) result[col] = arr # convert_objects just in case return self._constructor(result, index=new_index, - columns=new_columns)._convert(datetime=True, - copy=False) + columns=new_columns) def combine_first(self, other): """ @@ -5203,15 +5195,28 @@ def combine_first(self, other): """ import pandas.core.computation.expressions as expressions - def combiner(x, y, needs_i8_conversion=False): - x_values = x.values if hasattr(x, 'values') else x - y_values = y.values if hasattr(y, 'values') else y - if needs_i8_conversion: - mask = isna(x) - x_values = x_values.view('i8') - y_values = y_values.view('i8') - else: - mask = isna(x_values) + def extract_values(arr): + # Does two things: + # 1. maybe gets the values from the Series / Index + # 2. 
convert datelike to i8 + if isinstance(arr, (ABCIndexClass, ABCSeries)): + arr = arr._values + + if needs_i8_conversion(arr): + # TODO(DatetimelikeArray): just use .asi8 + if is_extension_array_dtype(arr.dtype): + arr = arr.asi8 + else: + arr = arr.view('i8') + return arr + + def combiner(x, y): + mask = isna(x) + if isinstance(mask, (ABCIndexClass, ABCSeries)): + mask = mask._values + + x_values = extract_values(x) + y_values = extract_values(y) # If the column y in other DataFrame is not in first DataFrame, # just return y_values. diff --git a/pandas/tests/frame/test_combine_concat.py b/pandas/tests/frame/test_combine_concat.py index a43c5c7257daa..2803db4f496a5 100644 --- a/pandas/tests/frame/test_combine_concat.py +++ b/pandas/tests/frame/test_combine_concat.py @@ -31,6 +31,24 @@ def test_concat_multiple_frames_dtypes(self): expected = Series(dict(float64=2, float32=2)) assert_series_equal(results, expected) + @pytest.mark.parametrize('data', [ + pd.date_range('2000', periods=4), + pd.date_range('2000', periods=4, tz="US/Central"), + pd.period_range('2000', periods=4), + pd.timedelta_range(0, periods=4), + ]) + def test_combine_datetlike_udf(self, data): + # https://github.com/pandas-dev/pandas/issues/23079 + df = pd.DataFrame({"A": data}) + other = df.copy() + df.iloc[1, 0] = None + + def combiner(a, b): + return b + + result = df.combine(other, combiner) + tm.assert_frame_equal(result, other) + def test_concat_multiple_tzs(self): # GH 12467 # combining datetime tz-aware and naive DataFrames From d93990e446af58df47583a77e7b831484d00e4d8 Mon Sep 17 00:00:00 2001 From: jbrockmendel Date: Thu, 25 Oct 2018 17:22:32 -0700 Subject: [PATCH 13/23] fix and test incorrect case in delta_to_nanoseconds (#23302) --- pandas/_libs/tslibs/fields.pyx | 4 +-- pandas/_libs/tslibs/timedeltas.pxd | 4 +-- pandas/_libs/tslibs/timedeltas.pyx | 14 ++++----- pandas/_libs/tslibs/timezones.pyx | 2 +- pandas/tests/tslibs/test_timedeltas.py | 40 ++++++++++++++++++++++++++ 5 files changed, 51 insertions(+), 13 deletions(-) create mode 100644 pandas/tests/tslibs/test_timedeltas.py diff --git a/pandas/_libs/tslibs/fields.pyx b/pandas/_libs/tslibs/fields.pyx index 684344ceb9002..1af9cd619c5f9 100644 --- a/pandas/_libs/tslibs/fields.pyx +++ b/pandas/_libs/tslibs/fields.pyx @@ -40,7 +40,7 @@ def get_time_micros(ndarray[int64_t] dtindex): return micros -def build_field_sarray(ndarray[int64_t] dtindex): +def build_field_sarray(int64_t[:] dtindex): """ Datetime as int64 representation to a structured array of fields """ @@ -542,7 +542,7 @@ def get_date_field(ndarray[int64_t] dtindex, object field): @cython.wraparound(False) @cython.boundscheck(False) -def get_timedelta_field(ndarray[int64_t] tdindex, object field): +def get_timedelta_field(int64_t[:] tdindex, object field): """ Given a int64-based timedelta index, extract the days, hrs, sec., field and return an array of these values. diff --git a/pandas/_libs/tslibs/timedeltas.pxd b/pandas/_libs/tslibs/timedeltas.pxd index eda4418902513..c02a840281266 100644 --- a/pandas/_libs/tslibs/timedeltas.pxd +++ b/pandas/_libs/tslibs/timedeltas.pxd @@ -3,8 +3,6 @@ from numpy cimport int64_t # Exposed for tslib, not intended for outside use. -cdef parse_timedelta_string(object ts) -cpdef int64_t cast_from_unit(object ts, object unit) except? -1 +cdef int64_t cast_from_unit(object ts, object unit) except? -1 cpdef int64_t delta_to_nanoseconds(delta) except? 
-1
 cpdef convert_to_timedelta64(object ts, object unit)
-cpdef array_to_timedelta64(object[:] values, unit=*, errors=*)
diff --git a/pandas/_libs/tslibs/timedeltas.pyx b/pandas/_libs/tslibs/timedeltas.pyx
index b5b3abd01328c..12e9208177c2d 100644
--- a/pandas/_libs/tslibs/timedeltas.pyx
+++ b/pandas/_libs/tslibs/timedeltas.pyx
@@ -119,8 +119,6 @@ def ints_to_pytimedelta(int64_t[:] arr, box=False):
 # ----------------------------------------------------------------------

 cpdef int64_t delta_to_nanoseconds(delta) except? -1:
-    if util.is_array(delta):
-        return delta.astype('m8[ns]').astype('int64')
     if hasattr(delta, 'nanos'):
         return delta.nanos
     if hasattr(delta, 'delta'):
@@ -129,10 +127,12 @@ cpdef int64_t delta_to_nanoseconds(delta) except? -1:
         return delta.astype("timedelta64[ns]").item()
     if is_integer_object(delta):
         return delta
+    if PyDelta_Check(delta):
+        return (delta.days * 24 * 60 * 60 * 1000000 +
+                delta.seconds * 1000000 +
+                delta.microseconds) * 1000

-    return (delta.days * 24 * 60 * 60 * 1000000 +
-            delta.seconds * 1000000 +
-            delta.microseconds) * 1000
+    raise TypeError(type(delta))


 cpdef convert_to_timedelta64(object ts, object unit):
@@ -198,7 +198,7 @@ cpdef convert_to_timedelta64(object ts, object unit):
     return ts.astype('timedelta64[ns]')


-cpdef array_to_timedelta64(object[:] values, unit='ns', errors='raise'):
+def array_to_timedelta64(object[:] values, unit='ns', errors='raise'):
     """
     Convert an ndarray to an array of timedeltas. If errors == 'coerce',
     coerce non-convertible objects to NaT. Otherwise, raise.
@@ -235,7 +235,7 @@ cpdef array_to_timedelta64(object[:] values, unit='ns', errors='raise'):
     return iresult.base  # .base to access underlying np.ndarray


-cpdef inline int64_t cast_from_unit(object ts, object unit) except? -1:
+cdef inline int64_t cast_from_unit(object ts, object unit) except?
-1:
     """ return a casting of the unit represented to nanoseconds
    round the fractional part of a float to our precision, p """
     cdef:
diff --git a/pandas/_libs/tslibs/timezones.pyx b/pandas/_libs/tslibs/timezones.pyx
index b7e4de81da35c..1fc1347c8b9e3 100644
--- a/pandas/_libs/tslibs/timezones.pyx
+++ b/pandas/_libs/tslibs/timezones.pyx
@@ -322,7 +322,7 @@ cpdef bint tz_compare(object start, object end):
     return get_timezone(start) == get_timezone(end)


-cpdef tz_standardize(object tz):
+def tz_standardize(tz: object):
     """
     If the passed tz is a pytz timezone object, "normalize" it to the a
     consistent version
diff --git a/pandas/tests/tslibs/test_timedeltas.py b/pandas/tests/tslibs/test_timedeltas.py
new file mode 100644
index 0000000000000..939c2b828a75f
--- /dev/null
+++ b/pandas/tests/tslibs/test_timedeltas.py
@@ -0,0 +1,40 @@
+# -*- coding: utf-8 -*-
+import numpy as np
+import pytest
+
+import pandas as pd
+from pandas._libs.tslibs.timedeltas import delta_to_nanoseconds
+
+
+def test_delta_to_nanoseconds():
+    obj = np.timedelta64(14, 'D')
+    result = delta_to_nanoseconds(obj)
+    assert result == 14 * 24 * 3600 * 1e9
+
+    obj = pd.Timedelta(minutes=-7)
+    result = delta_to_nanoseconds(obj)
+    assert result == -7 * 60 * 1e9
+
+    obj = pd.Timedelta(minutes=-7).to_pytimedelta()
+    result = delta_to_nanoseconds(obj)
+    assert result == -7 * 60 * 1e9
+
+    obj = pd.offsets.Nano(125)
+    result = delta_to_nanoseconds(obj)
+    assert result == 125
+
+    obj = 1
+    result = delta_to_nanoseconds(obj)
+    assert result == 1
+
+    obj = np.int64(2)
+    result = delta_to_nanoseconds(obj)
+    assert result == 2
+
+    obj = np.int32(3)
+    result = delta_to_nanoseconds(obj)
+    assert result == 3
+
+    obj = np.array([123456789], dtype='m8[ns]')
+    with pytest.raises(TypeError):
+        delta_to_nanoseconds(obj)
From f79e174d07ad1f6b843c2f9fd187aff9b50d1582 Mon Sep 17 00:00:00 2001
From: topper-123
Date: Fri, 26 Oct 2018 01:11:54 +0000
Subject: [PATCH 14/23] PERF: speed up CategoricalIndex.get_loc (#23235)

---
 asv_bench/benchmarks/indexing_engines.py      |  28 ++-
 doc/source/whatsnew/v0.24.0.txt               |   8 +-
 pandas/_libs/algos.pyx                        |  24 ++-
 pandas/_libs/algos_common_helper.pxi.in       |   3 +
 pandas/_libs/index.pyx                        |   6 +-
 pandas/_libs/index_class_helper.pxi.in        |  35 ++--
 pandas/core/indexes/category.py               |  15 +-
 pandas/tests/indexes/test_category.py         |  24 ++-
 pandas/tests/indexing/conftest.py             |  20 +++
 .../tests/indexing/test_indexing_engines.py   | 168 ++++++++++++++++++
 10 files changed, 299 insertions(+), 32 deletions(-)
 create mode 100644 pandas/tests/indexing/conftest.py
 create mode 100644 pandas/tests/indexing/test_indexing_engines.py

diff --git a/asv_bench/benchmarks/indexing_engines.py b/asv_bench/benchmarks/indexing_engines.py
index 1e9283c7fb92b..f3d063ee31bc8 100644
--- a/asv_bench/benchmarks/indexing_engines.py
+++ b/asv_bench/benchmarks/indexing_engines.py
@@ -1,18 +1,30 @@
 import numpy as np

-from pandas._libs.index import (Int64Engine, UInt64Engine, Float64Engine,
-                                ObjectEngine)
+from pandas._libs import index as libindex
+
+
+def _get_numeric_engines():
+    engine_names = [
+        ('Int64Engine', np.int64), ('Int32Engine', np.int32),
+        ('Int16Engine', np.int16), ('Int8Engine', np.int8),
+        ('UInt64Engine', np.uint64), ('UInt32Engine', np.uint32),
+        ('UInt16Engine', np.uint16), ('UInt8Engine', np.uint8),
+        ('Float64Engine', np.float64), ('Float32Engine', np.float32),
+    ]
+    return [(getattr(libindex, engine_name), dtype)
+            for engine_name, dtype in engine_names
+            if hasattr(libindex, engine_name)]


 class NumericEngineIndexing(object):

-    params = [[Int64Engine,
UInt64Engine, Float64Engine],
-              [np.int64, np.uint64, np.float64],
+    params = [_get_numeric_engines(),
               ['monotonic_incr', 'monotonic_decr', 'non_monotonic'],
               ]
-    param_names = ['engine', 'dtype', 'index_type']
+    param_names = ['engine_and_dtype', 'index_type']

-    def setup(self, engine, dtype, index_type):
+    def setup(self, engine_and_dtype, index_type):
+        engine, dtype = engine_and_dtype
         N = 10**5
         values = list([1] * N + [2] * N + [3] * N)
         arr = {
@@ -26,7 +38,7 @@ def setup(self, engine, dtype, index_type):
         # code belows avoids populating the mapping etc. while timing.
         self.data.get_loc(2)

-    def time_get_loc(self, engine, dtype, index_type):
+    def time_get_loc(self, engine_and_dtype, index_type):
         self.data.get_loc(2)


@@ -44,7 +56,7 @@ def setup(self, index_type):
             'non_monotonic': np.array(list('abc') * N, dtype=object),
         }[index_type]

-        self.data = ObjectEngine(lambda: arr, len(arr))
+        self.data = libindex.ObjectEngine(lambda: arr, len(arr))
         # code belows avoids populating the mapping etc. while timing.
         self.data.get_loc('b')

diff --git a/doc/source/whatsnew/v0.24.0.txt b/doc/source/whatsnew/v0.24.0.txt
index 5fa391c3433ea..a2c89e16d0ecd 100644
--- a/doc/source/whatsnew/v0.24.0.txt
+++ b/doc/source/whatsnew/v0.24.0.txt
@@ -948,9 +948,11 @@ Removal of prior version deprecations/changes
 Performance Improvements
 ~~~~~~~~~~~~~~~~~~~~~~~~

-- Very large improvement in performance of slicing when the index is a :class:`CategoricalIndex`,
-  both when indexing by label (using .loc) and position(.iloc).
-  Likewise, slicing a ``CategoricalIndex`` itself (i.e. ``ci[100:200]``) shows similar speed improvements (:issue:`21659`)
+- Slicing Series and DataFrames with a monotonically increasing :class:`CategoricalIndex`
+  is now very fast and has speed comparable to slicing with an ``Int64Index``.
+  The speed increase applies both when indexing by label (using .loc) and by position (.iloc) (:issue:`20395`)
+  Slicing a monotonically increasing :class:`CategoricalIndex` itself (i.e. 
``ci[1000:2000]``) + shows similar speed improvements as above (:issue:`21659`) - Improved performance of :func:`Series.describe` in case of numeric dtpyes (:issue:`21274`) - Improved performance of :func:`pandas.core.groupby.GroupBy.rank` when dealing with tied rankings (:issue:`21237`) - Improved performance of :func:`DataFrame.set_index` with columns consisting of :class:`Period` objects (:issue:`21582`, :issue:`21606`) diff --git a/pandas/_libs/algos.pyx b/pandas/_libs/algos.pyx index d2914dc8ac751..3ba4c2375b4e8 100644 --- a/pandas/_libs/algos.pyx +++ b/pandas/_libs/algos.pyx @@ -10,7 +10,8 @@ from libc.math cimport fabs, sqrt import numpy as np cimport numpy as cnp from numpy cimport (ndarray, - NPY_INT64, NPY_UINT64, NPY_INT32, NPY_INT16, NPY_INT8, + NPY_INT64, NPY_INT32, NPY_INT16, NPY_INT8, + NPY_UINT64, NPY_UINT32, NPY_UINT16, NPY_UINT8, NPY_FLOAT32, NPY_FLOAT64, NPY_OBJECT, int8_t, int16_t, int32_t, int64_t, uint8_t, uint16_t, @@ -359,9 +360,13 @@ ctypedef fused algos_t: float64_t float32_t object - int32_t int64_t + int32_t + int16_t + int8_t uint64_t + uint32_t + uint16_t uint8_t @@ -459,7 +464,12 @@ pad_float32 = pad["float32_t"] pad_object = pad["object"] pad_int64 = pad["int64_t"] pad_int32 = pad["int32_t"] +pad_int16 = pad["int16_t"] +pad_int8 = pad["int8_t"] pad_uint64 = pad["uint64_t"] +pad_uint32 = pad["uint32_t"] +pad_uint16 = pad["uint16_t"] +pad_uint8 = pad["uint8_t"] pad_bool = pad["uint8_t"] @@ -653,7 +663,12 @@ backfill_float32 = backfill["float32_t"] backfill_object = backfill["object"] backfill_int64 = backfill["int64_t"] backfill_int32 = backfill["int32_t"] +backfill_int16 = backfill["int16_t"] +backfill_int8 = backfill["int8_t"] backfill_uint64 = backfill["uint64_t"] +backfill_uint32 = backfill["uint32_t"] +backfill_uint16 = backfill["uint16_t"] +backfill_uint8 = backfill["uint8_t"] backfill_bool = backfill["uint8_t"] @@ -866,7 +881,12 @@ is_monotonic_float32 = is_monotonic["float32_t"] is_monotonic_object = is_monotonic["object"] is_monotonic_int64 = is_monotonic["int64_t"] is_monotonic_int32 = is_monotonic["int32_t"] +is_monotonic_int16 = is_monotonic["int16_t"] +is_monotonic_int8 = is_monotonic["int8_t"] is_monotonic_uint64 = is_monotonic["uint64_t"] +is_monotonic_uint32 = is_monotonic["uint32_t"] +is_monotonic_uint16 = is_monotonic["uint16_t"] +is_monotonic_uint8 = is_monotonic["uint8_t"] is_monotonic_bool = is_monotonic["uint8_t"] diff --git a/pandas/_libs/algos_common_helper.pxi.in b/pandas/_libs/algos_common_helper.pxi.in index b39b5eaced8fd..518664d70cf06 100644 --- a/pandas/_libs/algos_common_helper.pxi.in +++ b/pandas/_libs/algos_common_helper.pxi.in @@ -133,6 +133,9 @@ dtypes = [('float64', 'FLOAT64', 'float64'), ('int16', 'INT16', 'int16'), ('int32', 'INT32', 'int32'), ('int64', 'INT64', 'int64'), + ('uint8', 'UINT8', 'uint8'), + ('uint16', 'UINT16', 'uint16'), + ('uint32', 'UINT32', 'uint32'), ('uint64', 'UINT64', 'uint64'), # ('platform_int', 'INT', 'int_'), # ('object', 'OBJECT', 'object_'), diff --git a/pandas/_libs/index.pyx b/pandas/_libs/index.pyx index 3f76915655f58..d418ac63a4ac8 100644 --- a/pandas/_libs/index.pyx +++ b/pandas/_libs/index.pyx @@ -5,8 +5,10 @@ import cython import numpy as np cimport numpy as cnp -from numpy cimport (ndarray, float64_t, int32_t, - int64_t, uint8_t, uint64_t, intp_t, +from numpy cimport (ndarray, intp_t, + float64_t, float32_t, + int64_t, int32_t, int16_t, int8_t, + uint64_t, uint32_t, uint16_t, uint8_t, # Note: NPY_DATETIME, NPY_TIMEDELTA are only available # for cimport in cython>=0.27.3 NPY_DATETIME, 
NPY_TIMEDELTA) diff --git a/pandas/_libs/index_class_helper.pxi.in b/pandas/_libs/index_class_helper.pxi.in index 4ea35da0626f3..c19812efaaa35 100644 --- a/pandas/_libs/index_class_helper.pxi.in +++ b/pandas/_libs/index_class_helper.pxi.in @@ -10,14 +10,22 @@ WARNING: DO NOT edit .pxi FILE directly, .pxi is generated from .pxi.in {{py: -# name, dtype, ctype -dtypes = [('Float64', 'float64', 'float64_t'), - ('UInt64', 'uint64', 'uint64_t'), - ('Int64', 'int64', 'int64_t'), - ('Object', 'object', 'object')] +# name, dtype, ctype, hashtable_name, hashtable_dtype +dtypes = [('Float64', 'float64', 'float64_t', 'Float64', 'float64'), + ('Float32', 'float32', 'float32_t', 'Float64', 'float64'), + ('Int64', 'int64', 'int64_t', 'Int64', 'int64'), + ('Int32', 'int32', 'int32_t', 'Int64', 'int64'), + ('Int16', 'int16', 'int16_t', 'Int64', 'int64'), + ('Int8', 'int8', 'int8_t', 'Int64', 'int64'), + ('UInt64', 'uint64', 'uint64_t', 'UInt64', 'uint64'), + ('UInt32', 'uint32', 'uint32_t', 'UInt64', 'uint64'), + ('UInt16', 'uint16', 'uint16_t', 'UInt64', 'uint64'), + ('UInt8', 'uint8', 'uint8_t', 'UInt64', 'uint64'), + ('Object', 'object', 'object', 'PyObject', 'object'), + ] }} -{{for name, dtype, ctype in dtypes}} +{{for name, dtype, ctype, hashtable_name, hashtable_dtype in dtypes}} cdef class {{name}}Engine(IndexEngine): @@ -34,13 +42,9 @@ cdef class {{name}}Engine(IndexEngine): other, limit=limit) cdef _make_hash_table(self, n): - {{if name == 'Object'}} - return _hash.PyObjectHashTable(n) - {{else}} - return _hash.{{name}}HashTable(n) - {{endif}} + return _hash.{{hashtable_name}}HashTable(n) - {{if name != 'Float64' and name != 'Object'}} + {{if name not in {'Float64', 'Float32', 'Object'} }} cdef _check_type(self, object val): hash(val) if util.is_bool_object(val): @@ -50,6 +54,11 @@ cdef class {{name}}Engine(IndexEngine): {{endif}} {{if name != 'Object'}} + cpdef _call_map_locations(self, values): + # self.mapping is of type {{hashtable_name}}HashTable, + # so convert dtype of values + self.mapping.map_locations(algos.ensure_{{hashtable_dtype}}(values)) + cdef _get_index_values(self): return algos.ensure_{{dtype}}(self.vgetter()) @@ -60,7 +69,7 @@ cdef class {{name}}Engine(IndexEngine): ndarray[{{ctype}}] values int count = 0 - {{if name != 'Float64'}} + {{if name not in {'Float64', 'Float32'} }} if not util.is_integer_object(val): raise KeyError(val) {{endif}} diff --git a/pandas/core/indexes/category.py b/pandas/core/indexes/category.py index e4250ae790553..278e395d65014 100644 --- a/pandas/core/indexes/category.py +++ b/pandas/core/indexes/category.py @@ -84,7 +84,17 @@ class CategoricalIndex(Index, accessor.PandasDelegate): """ _typ = 'categoricalindex' - _engine_type = libindex.Int64Engine + + @property + def _engine_type(self): + # self.codes can have dtype int8, int16, int32 or int64, so we need + # to return the corresponding engine type (libindex.Int8Engine, etc.). 
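+        # For example, an index with fewer than 128 categories stores its
+        # codes as int8, so the mapping below selects libindex.Int8Engine.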
+ return {np.int8: libindex.Int8Engine, + np.int16: libindex.Int16Engine, + np.int32: libindex.Int32Engine, + np.int64: libindex.Int64Engine, + }[self.codes.dtype.type] + _attributes = ['name'] def __new__(cls, data=None, categories=None, ordered=None, dtype=None, @@ -382,7 +392,7 @@ def argsort(self, *args, **kwargs): def _engine(self): # we are going to look things up with the codes themselves - return self._engine_type(lambda: self.codes.astype('i8'), len(self)) + return self._engine_type(lambda: self.codes, len(self)) # introspection @cache_readonly @@ -450,6 +460,7 @@ def get_loc(self, key, method=None): array([False, True, False, True], dtype=bool) """ code = self.categories.get_loc(key) + code = self.codes.dtype.type(code) try: return self._engine.get_loc(code) except KeyError: diff --git a/pandas/tests/indexes/test_category.py b/pandas/tests/indexes/test_category.py index 99058f883a392..d89baa41d33fe 100644 --- a/pandas/tests/indexes/test_category.py +++ b/pandas/tests/indexes/test_category.py @@ -1,16 +1,16 @@ # -*- coding: utf-8 -*- import pytest +import numpy as np import pandas.util.testing as tm from pandas.core.indexes.api import Index, CategoricalIndex from pandas.core.dtypes.dtypes import CategoricalDtype +from pandas._libs import index as libindex from .common import Base from pandas.compat import range, PY3 -import numpy as np - from pandas import Categorical, IntervalIndex, compat from pandas.util.testing import assert_almost_equal import pandas.core.config as cf @@ -1117,3 +1117,23 @@ def test_take_invalid_kwargs(self): msg = "the 'mode' parameter is not supported" tm.assert_raises_regex(ValueError, msg, idx.take, indices, mode='clip') + + @pytest.mark.parametrize('dtype, engine_type', [ + (np.int8, libindex.Int8Engine), + (np.int16, libindex.Int16Engine), + (np.int32, libindex.Int32Engine), + (np.int64, libindex.Int64Engine), + ]) + def test_engine_type(self, dtype, engine_type): + if dtype != np.int64: + # num. of uniques required to push CategoricalIndex.codes to a + # dtype (128 categories required for .codes dtype to be int16 etc.) 
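+            # (codes are stored in the smallest signed integer dtype that
+            # fits: 1 category keeps codes at int8, 128 categories push
+            # them to int16, 32768 to int32, per num_uniques below)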
+ num_uniques = {np.int8: 1, np.int16: 128, np.int32: 32768}[dtype] + ci = pd.CategoricalIndex(range(num_uniques)) + else: + # having 2**32 - 2**31 categories would be very memory-intensive, + # so we cheat a bit with the dtype + ci = pd.CategoricalIndex(range(32768)) # == 2**16 - 2**(16 - 1) + ci.values._codes = ci.values._codes.astype('int64') + assert np.issubdtype(ci.codes.dtype, dtype) + assert isinstance(ci._engine, engine_type) diff --git a/pandas/tests/indexing/conftest.py b/pandas/tests/indexing/conftest.py new file mode 100644 index 0000000000000..be1cf4800a2ef --- /dev/null +++ b/pandas/tests/indexing/conftest.py @@ -0,0 +1,20 @@ +import numpy as np +import pytest + +from pandas._libs import index as libindex + + +@pytest.fixture(params=[ + (libindex.Int64Engine, np.int64), + (libindex.Int32Engine, np.int32), + (libindex.Int16Engine, np.int16), + (libindex.Int8Engine, np.int8), + (libindex.UInt64Engine, np.uint64), + (libindex.UInt32Engine, np.uint32), + (libindex.UInt16Engine, np.uint16), + (libindex.UInt8Engine, np.uint8), + (libindex.Float64Engine, np.float64), + (libindex.Float32Engine, np.float32), +], ids=lambda x: x[0].__name__) +def numeric_indexing_engine_type_and_dtype(request): + return request.param diff --git a/pandas/tests/indexing/test_indexing_engines.py b/pandas/tests/indexing/test_indexing_engines.py new file mode 100644 index 0000000000000..410eba99948ce --- /dev/null +++ b/pandas/tests/indexing/test_indexing_engines.py @@ -0,0 +1,168 @@ +import numpy as np + +import pandas.util.testing as tm +from pandas import compat +from pandas._libs import algos as libalgos, index as libindex + + +class TestNumericEngine(object): + def test_is_monotonic(self, numeric_indexing_engine_type_and_dtype): + engine_type, dtype = numeric_indexing_engine_type_and_dtype + num = 1000 + arr = np.array([1] * num + [2] * num + [3] * num, dtype=dtype) + + # monotonic increasing + engine = engine_type(lambda: arr, len(arr)) + assert engine.is_monotonic_increasing is True + assert engine.is_monotonic_decreasing is False + + # monotonic decreasing + engine = engine_type(lambda: arr[::-1], len(arr)) + assert engine.is_monotonic_increasing is False + assert engine.is_monotonic_decreasing is True + + # neither monotonic increasing or decreasing + arr = np.array([1] * num + [2] * num + [1] * num, dtype=dtype) + engine = engine_type(lambda: arr[::-1], len(arr)) + assert engine.is_monotonic_increasing is False + assert engine.is_monotonic_decreasing is False + + def test_is_unique(self, numeric_indexing_engine_type_and_dtype): + engine_type, dtype = numeric_indexing_engine_type_and_dtype + + # unique + arr = np.array([1, 3, 2], dtype=dtype) + engine = engine_type(lambda: arr, len(arr)) + assert engine.is_unique is True + + # not unique + arr = np.array([1, 2, 1], dtype=dtype) + engine = engine_type(lambda: arr, len(arr)) + assert engine.is_unique is False + + def test_get_loc(self, numeric_indexing_engine_type_and_dtype): + engine_type, dtype = numeric_indexing_engine_type_and_dtype + + # unique + arr = np.array([1, 2, 3], dtype=dtype) + engine = engine_type(lambda: arr, len(arr)) + assert engine.get_loc(2) == 1 + + # monotonic + num = 1000 + arr = np.array([1] * num + [2] * num + [3] * num, dtype=dtype) + engine = engine_type(lambda: arr, len(arr)) + assert engine.get_loc(2) == slice(1000, 2000) + + # not monotonic + arr = np.array([1, 2, 3] * num, dtype=dtype) + engine = engine_type(lambda: arr, len(arr)) + expected = np.array([False, True, False] * num, dtype=bool) + result = 
engine.get_loc(2) + assert (result == expected).all() + + def test_get_backfill_indexer( + self, numeric_indexing_engine_type_and_dtype): + engine_type, dtype = numeric_indexing_engine_type_and_dtype + + arr = np.array([1, 5, 10], dtype=dtype) + engine = engine_type(lambda: arr, len(arr)) + + new = np.array(compat.range(12), dtype=dtype) + result = engine.get_backfill_indexer(new) + + expected = libalgos.backfill(arr, new) + tm.assert_numpy_array_equal(result, expected) + + def test_get_pad_indexer( + self, numeric_indexing_engine_type_and_dtype): + engine_type, dtype = numeric_indexing_engine_type_and_dtype + + arr = np.array([1, 5, 10], dtype=dtype) + engine = engine_type(lambda: arr, len(arr)) + + new = np.array(compat.range(12), dtype=dtype) + result = engine.get_pad_indexer(new) + + expected = libalgos.pad(arr, new) + tm.assert_numpy_array_equal(result, expected) + + +class TestObjectEngine(object): + engine_type = libindex.ObjectEngine + dtype = np.object_ + values = list('abc') + + def test_is_monotonic(self): + + num = 1000 + arr = np.array(['a'] * num + ['a'] * num + ['c'] * num, + dtype=self.dtype) + + # monotonic increasing + engine = self.engine_type(lambda: arr, len(arr)) + assert engine.is_monotonic_increasing is True + assert engine.is_monotonic_decreasing is False + + # monotonic decreasing + engine = self.engine_type(lambda: arr[::-1], len(arr)) + assert engine.is_monotonic_increasing is False + assert engine.is_monotonic_decreasing is True + + # neither monotonic increasing or decreasing + arr = np.array(['a'] * num + ['b'] * num + ['a'] * num, + dtype=self.dtype) + engine = self.engine_type(lambda: arr[::-1], len(arr)) + assert engine.is_monotonic_increasing is False + assert engine.is_monotonic_decreasing is False + + def test_is_unique(self): + # unique + arr = np.array(self.values, dtype=self.dtype) + engine = self.engine_type(lambda: arr, len(arr)) + assert engine.is_unique is True + + # not unique + arr = np.array(['a', 'b', 'a'], dtype=self.dtype) + engine = self.engine_type(lambda: arr, len(arr)) + assert engine.is_unique is False + + def test_get_loc(self): + # unique + arr = np.array(self.values, dtype=self.dtype) + engine = self.engine_type(lambda: arr, len(arr)) + assert engine.get_loc('b') == 1 + + # monotonic + num = 1000 + arr = np.array(['a'] * num + ['b'] * num + ['c'] * num, + dtype=self.dtype) + engine = self.engine_type(lambda: arr, len(arr)) + assert engine.get_loc('b') == slice(1000, 2000) + + # not monotonic + arr = np.array(self.values * num, dtype=self.dtype) + engine = self.engine_type(lambda: arr, len(arr)) + expected = np.array([False, True, False] * num, dtype=bool) + result = engine.get_loc('b') + assert (result == expected).all() + + def test_get_backfill_indexer(self): + arr = np.array(['a', 'e', 'j'], dtype=self.dtype) + engine = self.engine_type(lambda: arr, len(arr)) + + new = np.array(list('abcdefghij'), dtype=self.dtype) + result = engine.get_backfill_indexer(new) + + expected = libalgos.backfill_object(arr, new) + tm.assert_numpy_array_equal(result, expected) + + def test_get_pad_indexer(self): + arr = np.array(['a', 'e', 'j'], dtype=self.dtype) + engine = self.engine_type(lambda: arr, len(arr)) + + new = np.array(list('abcdefghij'), dtype=self.dtype) + result = engine.get_pad_indexer(new) + + expected = libalgos.pad_object(arr, new) + tm.assert_numpy_array_equal(result, expected) From df4ffc7ced20abdcf20603ab01035d2283e3c01e Mon Sep 17 00:00:00 2001 From: Tom Augspurger Date: Thu, 25 Oct 2018 20:28:55 -0500 Subject: [PATCH 15/23] 
API: Add sparse Acessor (#23183) --- doc/source/api.rst | 16 +++ doc/source/sparse.rst | 20 +++ doc/source/whatsnew/v0.24.0.txt | 8 +- pandas/core/accessor.py | 11 +- pandas/core/arrays/sparse.py | 174 +++++++++++++++++++++++ pandas/core/indexes/accessors.py | 1 - pandas/core/series.py | 4 +- pandas/core/sparse/series.py | 93 +----------- pandas/tests/arrays/sparse/test_array.py | 49 +++++++ 9 files changed, 281 insertions(+), 95 deletions(-) diff --git a/doc/source/api.rst b/doc/source/api.rst index 1ec2a56dcd094..6e8eb83577c46 100644 --- a/doc/source/api.rst +++ b/doc/source/api.rst @@ -851,6 +851,22 @@ Sparse SparseSeries.to_coo SparseSeries.from_coo +.. autosummary:: + :toctree: generated/ + :template: autosummary/accessor_attribute.rst + + Series.sparse.npoints + Series.sparse.density + Series.sparse.fill_value + Series.sparse.sp_values + + +.. autosummary:: + :toctree: generated/ + + Series.sparse.from_coo + Series.sparse.to_coo + .. _api.dataframe: DataFrame diff --git a/doc/source/sparse.rst b/doc/source/sparse.rst index 2bb99dd1822b6..884512981e1c9 100644 --- a/doc/source/sparse.rst +++ b/doc/source/sparse.rst @@ -62,6 +62,26 @@ Any sparse object can be converted back to the standard dense form by calling sts.to_dense() +.. _sparse.accessor: + +Sparse Accessor +--------------- + +.. versionadded:: 0.24.0 + +Pandas provides a ``.sparse`` accessor, similar to ``.str`` for string data, ``.cat`` +for categorical data, and ``.dt`` for datetime-like data. This namespace provides +attributes and methods that are specific to sparse data. + +.. ipython:: python + + s = pd.Series([0, 0, 1, 2], dtype="Sparse[int]") + s.sparse.density + s.sparse.fill_value + +This accessor is available only on data with ``SparseDtype``, and on the :class:`Series` +class itself for creating a Series with sparse data from a scipy COO matrix with. + .. _sparse.array: SparseArray diff --git a/doc/source/whatsnew/v0.24.0.txt b/doc/source/whatsnew/v0.24.0.txt index a2c89e16d0ecd..768868d585721 100644 --- a/doc/source/whatsnew/v0.24.0.txt +++ b/doc/source/whatsnew/v0.24.0.txt @@ -532,7 +532,6 @@ changes were made: - ``SparseDataFrame.combine`` and ``DataFrame.combine_first`` no longer supports combining a sparse column with a dense column while preserving the sparse subtype. The result will be an object-dtype SparseArray. - Setting :attr:`SparseArray.fill_value` to a fill value with a different dtype is now allowed. - Some new warnings are issued for operations that require or are likely to materialize a large dense array: - A :class:`errors.PerformanceWarning` is issued when using fillna with a ``method``, as a dense array is constructed to create the filled array. Filling with a ``value`` is the efficient way to fill a sparse array. @@ -540,6 +539,13 @@ Some new warnings are issued for operations that require or are likely to materi In addition to these API breaking changes, many :ref:`performance improvements and bug fixes have been made `. +Finally, a ``Series.sparse`` accessor was added to provide sparse-specific methods like :meth:`Series.sparse.from_coo`. + +.. ipython:: python + + s = pd.Series([0, 0, 1, 1, 1], dtype='Sparse[int]') + s.sparse.density + .. 
_whatsnew_0240.api_breaking.frame_to_dict_index_orient:
 
 Raise ValueError in ``DataFrame.to_dict(orient='index')``
 
diff --git a/pandas/core/accessor.py b/pandas/core/accessor.py
index eab529584d1fb..bc91372e3ac7d 100644
--- a/pandas/core/accessor.py
+++ b/pandas/core/accessor.py
@@ -113,15 +113,18 @@ def delegate_names(delegate, accessors, typ, overwrite=False):
 
     Parameters
     ----------
-    delegate : the class to get methods/properties & doc-strings
-    acccessors : string list of accessors to add
-    typ : 'property' or 'method'
+    delegate : object
+        The class to get methods/properties & doc-strings.
+    accessors : Sequence[str]
+        List of accessors to add.
+    typ : {'property', 'method'}
     overwrite : boolean, default False
        overwrite the method/property in the target class if it exists
 
     Returns
     -------
-    decorator
+    callable
+        A class decorator.
 
     Examples
     --------
diff --git a/pandas/core/arrays/sparse.py b/pandas/core/arrays/sparse.py
index 920a9f8286f0d..72527cfa5d12e 100644
--- a/pandas/core/arrays/sparse.py
+++ b/pandas/core/arrays/sparse.py
@@ -17,6 +17,7 @@
 from pandas.errors import PerformanceWarning
 from pandas.compat.numpy import function as nv
 
+from pandas.core.accessor import PandasDelegate, delegate_names
 from pandas.core.arrays import ExtensionArray, ExtensionOpsMixin
 import pandas.core.common as com
 from pandas.core.dtypes.base import ExtensionDtype
@@ -178,6 +179,7 @@ def _is_boolean(self):
 
     @property
     def kind(self):
+        """The sparse kind. Either 'integer', or 'block'."""
         return self.subtype.kind
 
     @property
@@ -648,10 +650,22 @@ def _from_factorized(cls, values, original):
     # ------------------------------------------------------------------------
     @property
     def sp_index(self):
+        """
+        The SparseIndex containing the location of non- ``fill_value`` points.
+        """
         return self._sparse_index
 
     @property
     def sp_values(self):
+        """
+        An ndarray containing the non- ``fill_value`` values.
+
+        Examples
+        --------
+        >>> s = SparseArray([0, 0, 1, 0, 2], fill_value=0)
+        >>> s.sp_values
+        array([1, 2])
+        """
         return self._sparse_values
 
     @property
@@ -704,6 +718,31 @@ def _fill_value_matches(self, fill_value):
     def nbytes(self):
         return self.sp_values.nbytes + self.sp_index.nbytes
 
+    @property
+    def density(self):
+        """The percent of non- ``fill_value`` points, as decimal.
+
+        Examples
+        --------
+        >>> s = SparseArray([0, 0, 1, 1, 1], fill_value=0)
+        >>> s.density
+        0.6
+        """
+        r = float(self.sp_index.npoints) / float(self.sp_index.length)
+        return r
+
+    @property
+    def npoints(self):
+        """The number of non- ``fill_value`` points.
+
+        Examples
+        --------
+        >>> s = SparseArray([0, 0, 1, 1, 1], fill_value=0)
+        >>> s.npoints
+        3
+        """
+        return self.sp_index.npoints
+
     @property
     def values(self):
         """
@@ -1744,3 +1783,138 @@ def _make_index(length, indices, kind):
     else:  # pragma: no cover
         raise ValueError('must be block or integer type')
     return index
+
+
+# ----------------------------------------------------------------------------
+# Accessor
+
+@delegate_names(SparseArray, ['npoints', 'density', 'fill_value',
+                              'sp_values'],
+                typ='property')
+class SparseAccessor(PandasDelegate):
+    def __init__(self, data=None):
+        self._validate(data)
+        # Store the Series since we need that for to_coo
+        self._parent = data
+
+    @staticmethod
+    def _validate(data):
+        if not isinstance(data.dtype, SparseDtype):
+            msg = "Can only use the '.sparse' accessor with Sparse data." 
+            raise AttributeError(msg)
+
+    def _delegate_property_get(self, name, *args, **kwargs):
+        return getattr(self._parent.values, name)
+
+    def _delegate_method(self, name, *args, **kwargs):
+        if name == 'from_coo':
+            return self.from_coo(*args, **kwargs)
+        elif name == 'to_coo':
+            return self.to_coo(*args, **kwargs)
+        else:
+            raise ValueError
+
+    @classmethod
+    def from_coo(cls, A, dense_index=False):
+        """
+        Create a SparseSeries from a scipy.sparse.coo_matrix.
+
+        Parameters
+        ----------
+        A : scipy.sparse.coo_matrix
+        dense_index : bool, default False
+            If False (default), the SparseSeries index consists of only the
+            coords of the non-null entries of the original coo_matrix.
+            If True, the SparseSeries index consists of the full sorted
+            (row, col) coordinates of the coo_matrix.
+
+        Returns
+        -------
+        s : SparseSeries
+
+        Examples
+        --------
+        >>> from scipy import sparse
+        >>> A = sparse.coo_matrix(([3.0, 1.0, 2.0], ([1, 0, 0], [0, 2, 3])),
+                                  shape=(3, 4))
+        >>> A
+        <3x4 sparse matrix of type '<class 'numpy.float64'>'
+                with 3 stored elements in COOrdinate format>
+        >>> A.todense()
+        matrix([[ 0.,  0.,  1.,  2.],
+                [ 3.,  0.,  0.,  0.],
+                [ 0.,  0.,  0.,  0.]])
+        >>> ss = pd.SparseSeries.from_coo(A)
+        >>> ss
+        0  2    1
+           3    2
+        1  0    3
+        dtype: float64
+        BlockIndex
+        Block locations: array([0], dtype=int32)
+        Block lengths: array([3], dtype=int32)
+        """
+        from pandas.core.sparse.scipy_sparse import _coo_to_sparse_series
+        from pandas import Series
+
+        result = _coo_to_sparse_series(A, dense_index=dense_index)
+        # SparseSeries -> Series[sparse]
+        result = Series(result.values, index=result.index, copy=False)
+
+        return result
+
+    def to_coo(self, row_levels=(0, ), column_levels=(1, ), sort_labels=False):
+        """
+        Create a scipy.sparse.coo_matrix from a SparseSeries with MultiIndex.
+
+        Use row_levels and column_levels to determine the row and column
+        coordinates respectively. row_levels and column_levels are the names
+        (labels) or numbers of the levels. {row_levels, column_levels} must be
+        a partition of the MultiIndex level names (or numbers).
+
+        Parameters
+        ----------
+        row_levels : tuple/list
+        column_levels : tuple/list
+        sort_labels : bool, default False
+            Sort the row and column labels before forming the sparse matrix. 
+ + Returns + ------- + y : scipy.sparse.coo_matrix + rows : list (row labels) + columns : list (column labels) + + Examples + -------- + >>> s = pd.Series([3.0, np.nan, 1.0, 3.0, np.nan, np.nan]) + >>> s.index = pd.MultiIndex.from_tuples([(1, 2, 'a', 0), + (1, 2, 'a', 1), + (1, 1, 'b', 0), + (1, 1, 'b', 1), + (2, 1, 'b', 0), + (2, 1, 'b', 1)], + names=['A', 'B', 'C', 'D']) + >>> ss = s.to_sparse() + >>> A, rows, columns = ss.to_coo(row_levels=['A', 'B'], + column_levels=['C', 'D'], + sort_labels=True) + >>> A + <3x4 sparse matrix of type '' + with 3 stored elements in COOrdinate format> + >>> A.todense() + matrix([[ 0., 0., 1., 3.], + [ 3., 0., 0., 0.], + [ 0., 0., 0., 0.]]) + >>> rows + [(1, 1), (1, 2), (2, 1)] + >>> columns + [('a', 0), ('a', 1), ('b', 0), ('b', 1)] + """ + from pandas.core.sparse.scipy_sparse import _sparse_series_to_coo + + A, rows, columns = _sparse_series_to_coo(self._parent, + row_levels, + column_levels, + sort_labels=sort_labels) + return A, rows, columns diff --git a/pandas/core/indexes/accessors.py b/pandas/core/indexes/accessors.py index 35b9799579628..c3b94c297652a 100644 --- a/pandas/core/indexes/accessors.py +++ b/pandas/core/indexes/accessors.py @@ -1,7 +1,6 @@ """ datetimelike delegation """ - import numpy as np from pandas.core.dtypes.generic import ABCSeries diff --git a/pandas/core/series.py b/pandas/core/series.py index d3ea005d3aae7..d813d8430d9e9 100644 --- a/pandas/core/series.py +++ b/pandas/core/series.py @@ -26,6 +26,7 @@ from pandas.core.accessor import CachedAccessor from pandas.core.arrays import ExtensionArray, period_array from pandas.core.arrays.categorical import Categorical, CategoricalAccessor +from pandas.core.arrays.sparse import SparseAccessor from pandas.core.config import get_option from pandas.core.dtypes.cast import ( construct_1d_arraylike_from_scalar, construct_1d_ndarray_preserving_na, @@ -142,7 +143,7 @@ class Series(base.IndexOpsMixin, generic.NDFrame): Copy input data """ _metadata = ['name'] - _accessors = {'dt', 'cat', 'str'} + _accessors = {'dt', 'cat', 'str', 'sparse'} _deprecations = generic.NDFrame._deprecations | frozenset( ['asobject', 'sortlevel', 'reshape', 'get_value', 'set_value', 'from_csv', 'valid']) @@ -4151,6 +4152,7 @@ def to_period(self, freq=None, copy=True): dt = CachedAccessor("dt", CombinedDatetimelikeProperties) cat = CachedAccessor("cat", CategoricalAccessor) plot = CachedAccessor("plot", gfx.SeriesPlotMethods) + sparse = CachedAccessor("sparse", SparseAccessor) # ---------------------------------------------------------------------- # Add plotting methods to Series diff --git a/pandas/core/sparse/series.py b/pandas/core/sparse/series.py index 5a747c6e4b1d1..ff32712f9056a 100644 --- a/pandas/core/sparse/series.py +++ b/pandas/core/sparse/series.py @@ -27,6 +27,7 @@ from pandas.core.arrays import ( SparseArray, ) +from pandas.core.arrays.sparse import SparseAccessor from pandas._libs.sparse import BlockIndex, IntIndex import pandas._libs.sparse as splib @@ -183,7 +184,7 @@ def sp_values(self): @property def npoints(self): - return self.sp_index.npoints + return self.values.npoints @classmethod def from_array(cls, arr, index=None, name=None, copy=False, @@ -452,8 +453,7 @@ def to_dense(self): @property def density(self): - r = float(self.sp_index.npoints) / float(self.sp_index.length) - return r + return self.values.density def copy(self, deep=True): """ @@ -580,99 +580,16 @@ def combine_first(self, other): dense_combined = self.to_dense().combine_first(other) return 
dense_combined.to_sparse(fill_value=self.fill_value) + @Appender(SparseAccessor.to_coo.__doc__) def to_coo(self, row_levels=(0, ), column_levels=(1, ), sort_labels=False): - """ - Create a scipy.sparse.coo_matrix from a SparseSeries with MultiIndex. - - Use row_levels and column_levels to determine the row and column - coordinates respectively. row_levels and column_levels are the names - (labels) or numbers of the levels. {row_levels, column_levels} must be - a partition of the MultiIndex level names (or numbers). - - Parameters - ---------- - row_levels : tuple/list - column_levels : tuple/list - sort_labels : bool, default False - Sort the row and column labels before forming the sparse matrix. - - Returns - ------- - y : scipy.sparse.coo_matrix - rows : list (row labels) - columns : list (column labels) - - Examples - -------- - >>> s = pd.Series([3.0, np.nan, 1.0, 3.0, np.nan, np.nan]) - >>> s.index = pd.MultiIndex.from_tuples([(1, 2, 'a', 0), - (1, 2, 'a', 1), - (1, 1, 'b', 0), - (1, 1, 'b', 1), - (2, 1, 'b', 0), - (2, 1, 'b', 1)], - names=['A', 'B', 'C', 'D']) - >>> ss = s.to_sparse() - >>> A, rows, columns = ss.to_coo(row_levels=['A', 'B'], - column_levels=['C', 'D'], - sort_labels=True) - >>> A - <3x4 sparse matrix of type '' - with 3 stored elements in COOrdinate format> - >>> A.todense() - matrix([[ 0., 0., 1., 3.], - [ 3., 0., 0., 0.], - [ 0., 0., 0., 0.]]) - >>> rows - [(1, 1), (1, 2), (2, 1)] - >>> columns - [('a', 0), ('a', 1), ('b', 0), ('b', 1)] - """ A, rows, columns = _sparse_series_to_coo(self, row_levels, column_levels, sort_labels=sort_labels) return A, rows, columns @classmethod + @Appender(SparseAccessor.from_coo.__doc__) def from_coo(cls, A, dense_index=False): - """ - Create a SparseSeries from a scipy.sparse.coo_matrix. - - Parameters - ---------- - A : scipy.sparse.coo_matrix - dense_index : bool, default False - If False (default), the SparseSeries index consists of only the - coords of the non-null entries of the original coo_matrix. - If True, the SparseSeries index consists of the full sorted - (row, col) coordinates of the coo_matrix. 
- - Returns - ------- - s : SparseSeries - - Examples - --------- - >>> from scipy import sparse - >>> A = sparse.coo_matrix(([3.0, 1.0, 2.0], ([1, 0, 0], [0, 2, 3])), - shape=(3, 4)) - >>> A - <3x4 sparse matrix of type '' - with 3 stored elements in COOrdinate format> - >>> A.todense() - matrix([[ 0., 0., 1., 2.], - [ 3., 0., 0., 0.], - [ 0., 0., 0., 0.]]) - >>> ss = pd.SparseSeries.from_coo(A) - >>> ss - 0 2 1 - 3 2 - 1 0 3 - dtype: float64 - BlockIndex - Block locations: array([0], dtype=int32) - Block lengths: array([3], dtype=int32) - """ return _coo_to_sparse_series(A, dense_index=dense_index) diff --git a/pandas/tests/arrays/sparse/test_array.py b/pandas/tests/arrays/sparse/test_array.py index e211b8626b53c..cc9512c0759fc 100644 --- a/pandas/tests/arrays/sparse/test_array.py +++ b/pandas/tests/arrays/sparse/test_array.py @@ -996,6 +996,55 @@ def test_asarray_datetime64(self): ) np.asarray(s) + def test_density(self): + arr = SparseArray([0, 1]) + assert arr.density == 0.5 + + def test_npoints(self): + arr = SparseArray([0, 1]) + assert arr.npoints == 1 + + +class TestAccessor(object): + + @pytest.mark.parametrize('attr', [ + 'npoints', 'density', 'fill_value', 'sp_values', + ]) + def test_get_attributes(self, attr): + arr = SparseArray([0, 1]) + ser = pd.Series(arr) + + result = getattr(ser.sparse, attr) + expected = getattr(arr, attr) + assert result == expected + + def test_from_coo(self): + sparse = pytest.importorskip("scipy.sparse") + + row = [0, 3, 1, 0] + col = [0, 3, 1, 2] + data = [4, 5, 7, 9] + sp_array = sparse.coo_matrix(data, (row, col)) + result = pd.Series.sparse.from_coo(sp_array) + + index = pd.MultiIndex.from_product([[0], [0, 1, 2, 3]]) + expected = pd.Series(data, index=index, dtype='Sparse[int]') + tm.assert_series_equal(result, expected) + + def test_to_coo(self): + sparse = pytest.importorskip("scipy.sparse") + ser = pd.Series([1, 2, 3], + index=pd.MultiIndex.from_product([[0], [1, 2, 3]], + names=['a', 'b']), + dtype='Sparse[int]') + A, _, _ = ser.sparse.to_coo() + assert isinstance(A, sparse.coo.coo_matrix) + + def test_non_sparse_raises(self): + ser = pd.Series([1, 2, 3]) + with tm.assert_raises_regex(AttributeError, '.sparse'): + ser.sparse.density + def test_setting_fill_value_fillna_still_works(): # This is why letting users update fill_value / dtype is bad From 6703ace009a5a52c6be70c86e618cb3aee34a04a Mon Sep 17 00:00:00 2001 From: Kaiqi Dong Date: Fri, 26 Oct 2018 03:38:17 +0200 Subject: [PATCH 16/23] TST: Add base test for extensionarray setitem #23300 (#23304) --- pandas/tests/extension/base/setitem.py | 49 ++++++++++++++------------ pandas/tests/extension/conftest.py | 6 ++++ 2 files changed, 33 insertions(+), 22 deletions(-) diff --git a/pandas/tests/extension/base/setitem.py b/pandas/tests/extension/base/setitem.py index 307543eca2b3e..6ebe3cb7487ab 100644 --- a/pandas/tests/extension/base/setitem.py +++ b/pandas/tests/extension/base/setitem.py @@ -9,18 +9,20 @@ class BaseSetitemTests(BaseExtensionTests): - def test_setitem_scalar_series(self, data): - arr = pd.Series(data) - arr[0] = data[1] - assert arr[0] == data[1] - - def test_setitem_sequence(self, data): - arr = pd.Series(data) + def test_setitem_scalar_series(self, data, box_in_series): + if box_in_series: + data = pd.Series(data) + data[0] = data[1] + assert data[0] == data[1] + + def test_setitem_sequence(self, data, box_in_series): + if box_in_series: + data = pd.Series(data) original = data.copy() - arr[[0, 1]] = [data[1], data[0]] - assert arr[0] == original[1] - assert arr[1] == 
original[0] + data[[0, 1]] = [data[1], data[0]] + assert data[0] == original[1] + assert data[1] == original[0] @pytest.mark.parametrize('as_array', [True, False]) def test_setitem_sequence_mismatched_length_raises(self, data, as_array): @@ -32,22 +34,25 @@ def test_setitem_sequence_mismatched_length_raises(self, data, as_array): xpr = 'cannot set using a {} indexer with a different length' with tm.assert_raises_regex(ValueError, xpr.format('list-like')): ser[[0, 1]] = value + assert ser._values[[0, 1]] == value with tm.assert_raises_regex(ValueError, xpr.format('slice')): ser[slice(3)] = value + assert ser._values[slice(3)] == value - def test_setitem_empty_indxer(self, data): - ser = pd.Series(data) - original = ser.copy() - ser[[]] = [] - self.assert_series_equal(ser, original) - - def test_setitem_sequence_broadcasts(self, data): - arr = pd.Series(data) - - arr[[0, 1]] = data[2] - assert arr[0] == data[2] - assert arr[1] == data[2] + def test_setitem_empty_indxer(self, data, box_in_series): + if box_in_series: + data = pd.Series(data) + original = data.copy() + data[np.array([], dtype=int)] = [] + self.assert_equal(data, original) + + def test_setitem_sequence_broadcasts(self, data, box_in_series): + if box_in_series: + data = pd.Series(data) + data[[0, 1]] = data[2] + assert data[0] == data[2] + assert data[1] == data[2] @pytest.mark.parametrize('setter', ['loc', 'iloc']) def test_setitem_scalar(self, data, setter): diff --git a/pandas/tests/extension/conftest.py b/pandas/tests/extension/conftest.py index 8e397d228a5b6..7758bd01840ae 100644 --- a/pandas/tests/extension/conftest.py +++ b/pandas/tests/extension/conftest.py @@ -98,3 +98,9 @@ def data_for_grouping(): Where A < B < C and NA is missing """ raise NotImplementedError + + +@pytest.fixture(params=[True, False]) +def box_in_series(request): + """Whether to box the data in a Series""" + return request.param From 437f31cb609372f465aaa853bf4b2299a9550716 Mon Sep 17 00:00:00 2001 From: Alexander Ponomaroff <33966871+alexander-ponomaroff@users.noreply.github.com> Date: Thu, 25 Oct 2018 21:51:06 -0400 Subject: [PATCH 17/23] Partialy fix issue #23334 - isort pandas/core/groupby directory (#23341) --- pandas/core/groupby/base.py | 3 +- pandas/core/groupby/categorical.py | 4 ++- pandas/core/groupby/generic.py | 52 +++++++++++++----------------- pandas/core/groupby/groupby.py | 38 +++++++++------------- pandas/core/groupby/grouper.py | 30 +++++++---------- pandas/core/groupby/ops.py | 47 +++++++++++---------------- setup.cfg | 6 ---- 7 files changed, 74 insertions(+), 106 deletions(-) diff --git a/pandas/core/groupby/base.py b/pandas/core/groupby/base.py index ac84971de08d8..9ef30b8fd021f 100644 --- a/pandas/core/groupby/base.py +++ b/pandas/core/groupby/base.py @@ -5,8 +5,9 @@ """ import types + +from pandas.core.dtypes.common import is_list_like, is_scalar from pandas.util._decorators import make_signature -from pandas.core.dtypes.common import is_scalar, is_list_like class GroupByMixin(object): diff --git a/pandas/core/groupby/categorical.py b/pandas/core/groupby/categorical.py index e54045884ea93..3e653704bbace 100644 --- a/pandas/core/groupby/categorical.py +++ b/pandas/core/groupby/categorical.py @@ -1,7 +1,9 @@ import numpy as np + from pandas.core.algorithms import unique1d from pandas.core.arrays.categorical import ( - _recode_for_categories, CategoricalDtype, Categorical) + Categorical, CategoricalDtype, _recode_for_categories +) def recode_for_groupby(c, sort, observed): diff --git a/pandas/core/groupby/generic.py 
b/pandas/core/groupby/generic.py index 63bf67854e5cd..a832eecf87721 100644 --- a/pandas/core/groupby/generic.py +++ b/pandas/core/groupby/generic.py @@ -7,48 +7,40 @@ """ import collections -import warnings import copy -from textwrap import dedent +import warnings from functools import partial +from textwrap import dedent import numpy as np -from pandas._libs import lib, Timestamp -from pandas.util._decorators import Substitution, Appender -from pandas import compat - -import pandas.core.indexes.base as ibase +import pandas.core.algorithms as algorithms import pandas.core.common as com -from pandas.core.panel import Panel +import pandas.core.indexes.base as ibase +from pandas import compat +from pandas._libs import Timestamp, lib from pandas.compat import lzip, map - -from pandas.core.series import Series -from pandas.core.generic import _shared_docs -from pandas.core.groupby.groupby import ( - GroupBy, _apply_docs, _transform_template) -from pandas.core.generic import NDFrame -from pandas.core.groupby import base +from pandas.compat.numpy import _np_version_under1p13 +from pandas.core.arrays import Categorical +from pandas.core.base import DataError, SpecificationError +from pandas.core.dtypes.cast import maybe_downcast_to_dtype from pandas.core.dtypes.common import ( - is_scalar, - is_bool, - is_datetimelike, - is_numeric_dtype, - is_integer_dtype, - is_interval_dtype, - ensure_platform_int, - ensure_int64) + ensure_int64, ensure_platform_int, is_bool, is_datetimelike, + is_integer_dtype, is_interval_dtype, is_numeric_dtype, is_scalar +) from pandas.core.dtypes.missing import isna, notna -import pandas.core.algorithms as algorithms from pandas.core.frame import DataFrame -from pandas.core.dtypes.cast import maybe_downcast_to_dtype -from pandas.core.base import SpecificationError, DataError -from pandas.core.index import Index, MultiIndex, CategoricalIndex -from pandas.core.arrays import Categorical +from pandas.core.generic import NDFrame, _shared_docs +from pandas.core.groupby import base +from pandas.core.groupby.groupby import ( + GroupBy, _apply_docs, _transform_template +) +from pandas.core.index import CategoricalIndex, Index, MultiIndex from pandas.core.internals import BlockManager, make_block -from pandas.compat.numpy import _np_version_under1p13 - +from pandas.core.panel import Panel +from pandas.core.series import Series from pandas.plotting._core import boxplot_frame_groupby +from pandas.util._decorators import Appender, Substitution class NDFrameGroupBy(GroupBy): diff --git a/pandas/core/groupby/groupby.py b/pandas/core/groupby/groupby.py index 025be781d9ee8..5acccbf688e30 100644 --- a/pandas/core/groupby/groupby.py +++ b/pandas/core/groupby/groupby.py @@ -7,42 +7,36 @@ class providing the base-class of operations. expose these user-facing objects to provide specific functionailty. 
""" -import types -from functools import wraps, partial -import datetime import collections +import datetime +import types import warnings from contextlib import contextmanager +from functools import partial, wraps import numpy as np -from pandas._libs import groupby as libgroupby, Timestamp -from pandas.util._validators import validate_kwargs -from pandas.util._decorators import ( - cache_readonly, Substitution, Appender) - +import pandas.core.algorithms as algorithms +import pandas.core.common as com from pandas import compat -from pandas.compat import zip, range, callable, set_function_name +from pandas._libs import Timestamp, groupby as libgroupby +from pandas.compat import callable, range, set_function_name, zip from pandas.compat.numpy import function as nv - -from pandas.core.dtypes.common import ( - is_numeric_dtype, - is_scalar, - ensure_float) +from pandas.core.base import ( + DataError, GroupByError, PandasObject, SelectionMixin, SpecificationError +) +from pandas.core.config import option_context from pandas.core.dtypes.cast import maybe_downcast_to_dtype +from pandas.core.dtypes.common import ensure_float, is_numeric_dtype, is_scalar from pandas.core.dtypes.missing import isna, notna - +from pandas.core.frame import DataFrame +from pandas.core.generic import NDFrame from pandas.core.groupby import base -from pandas.core.base import (PandasObject, SelectionMixin, GroupByError, - DataError, SpecificationError) from pandas.core.index import Index, MultiIndex -from pandas.core.generic import NDFrame -from pandas.core.frame import DataFrame from pandas.core.series import Series from pandas.core.sorting import get_group_index_sorter -import pandas.core.common as com -import pandas.core.algorithms as algorithms -from pandas.core.config import option_context +from pandas.util._decorators import Appender, Substitution, cache_readonly +from pandas.util._validators import validate_kwargs _doc_template = """ diff --git a/pandas/core/groupby/grouper.py b/pandas/core/groupby/grouper.py index 1c8fe0e6cadad..cbe87040b8117 100644 --- a/pandas/core/groupby/grouper.py +++ b/pandas/core/groupby/grouper.py @@ -4,31 +4,25 @@ """ import warnings -import numpy as np -from pandas.util._decorators import cache_readonly +import numpy as np +import pandas.core.algorithms as algorithms +import pandas.core.common as com from pandas import compat -from pandas.compat import zip, callable - -from pandas.core.dtypes.generic import ABCSeries -from pandas.core.arrays import ExtensionArray, Categorical -from pandas.core.index import ( - Index, MultiIndex, CategoricalIndex) +from pandas.compat import callable, zip +from pandas.core.arrays import Categorical, ExtensionArray from pandas.core.dtypes.common import ( - ensure_categorical, - is_hashable, - is_list_like, - is_timedelta64_dtype, - is_datetime64_dtype, - is_categorical_dtype, - is_scalar) -from pandas.core.series import Series + ensure_categorical, is_categorical_dtype, is_datetime64_dtype, is_hashable, + is_list_like, is_scalar, is_timedelta64_dtype +) +from pandas.core.dtypes.generic import ABCSeries from pandas.core.frame import DataFrame -import pandas.core.common as com from pandas.core.groupby.ops import BaseGrouper -import pandas.core.algorithms as algorithms +from pandas.core.index import CategoricalIndex, Index, MultiIndex +from pandas.core.series import Series from pandas.io.formats.printing import pprint_thing +from pandas.util._decorators import cache_readonly class Grouper(object): diff --git a/pandas/core/groupby/ops.py 
b/pandas/core/groupby/ops.py index b199127ac867b..af22744c4feec 100644 --- a/pandas/core/groupby/ops.py +++ b/pandas/core/groupby/ops.py @@ -6,42 +6,33 @@ are contained *in* the SeriesGroupBy and DataFrameGroupBy objects. """ -import copy import collections -import numpy as np - -from pandas._libs import lib, reduction, NaT, iNaT, groupby as libgroupby -from pandas.util._decorators import cache_readonly +import copy -from pandas.compat import zip, range, lzip +import numpy as np +import pandas.core.algorithms as algorithms +import pandas.core.common as com +from pandas._libs import NaT, groupby as libgroupby, iNaT, lib, reduction +from pandas.compat import lzip, range, zip from pandas.core.base import SelectionMixin -from pandas.core.dtypes.missing import isna, _maybe_fill -from pandas.core.index import ( - Index, MultiIndex, ensure_index) from pandas.core.dtypes.common import ( - ensure_float64, - ensure_platform_int, - ensure_int64, - ensure_int64_or_float64, - ensure_object, - needs_i8_conversion, - is_integer_dtype, - is_complex_dtype, - is_bool_dtype, - is_numeric_dtype, - is_timedelta64_dtype, - is_datetime64_any_dtype, - is_categorical_dtype) -from pandas.core.series import Series + ensure_float64, ensure_int64, ensure_int64_or_float64, ensure_object, + ensure_platform_int, is_bool_dtype, is_categorical_dtype, is_complex_dtype, + is_datetime64_any_dtype, is_integer_dtype, is_numeric_dtype, + is_timedelta64_dtype, needs_i8_conversion +) +from pandas.core.dtypes.missing import _maybe_fill, isna from pandas.core.frame import DataFrame from pandas.core.generic import NDFrame -import pandas.core.common as com from pandas.core.groupby import base -from pandas.core.sorting import (get_group_index_sorter, get_group_index, - compress_group_index, get_flattened_iterator, - decons_obs_group_ids, get_indexer_dict) -import pandas.core.algorithms as algorithms +from pandas.core.index import Index, MultiIndex, ensure_index +from pandas.core.series import Series +from pandas.core.sorting import ( + compress_group_index, decons_obs_group_ids, get_flattened_iterator, + get_group_index, get_group_index_sorter, get_indexer_dict +) +from pandas.util._decorators import cache_readonly def generate_bins_generic(values, binner, closed): diff --git a/setup.cfg b/setup.cfg index de3bd356e8f55..f26eac0d2ae62 100644 --- a/setup.cfg +++ b/setup.cfg @@ -167,12 +167,6 @@ skip= pandas/core/internals/concat.py, pandas/core/internals/managers.py, pandas/core/internals/blocks.py, - pandas/core/groupby/ops.py, - pandas/core/groupby/categorical.py, - pandas/core/groupby/generic.py, - pandas/core/groupby/groupby.py, - pandas/core/groupby/grouper.py, - pandas/core/groupby/base.py, pandas/core/reshape/concat.py, pandas/core/reshape/tile.py, pandas/core/reshape/melt.py, From cd16b91e5e33c2ad503492458827e5312f0d0659 Mon Sep 17 00:00:00 2001 From: Karmanya Aggarwal Date: Fri, 26 Oct 2018 14:45:50 +0530 Subject: [PATCH 18/23] DOC: update the is_month_start/is_month_end docstring (#23051) --- pandas/core/arrays/datetimes.py | 48 ++++++++++++++++++++------------- 1 file changed, 30 insertions(+), 18 deletions(-) diff --git a/pandas/core/arrays/datetimes.py b/pandas/core/arrays/datetimes.py index e269f2e02ddfd..cd20bcbed2211 100644 --- a/pandas/core/arrays/datetimes.py +++ b/pandas/core/arrays/datetimes.py @@ -1046,48 +1046,60 @@ def date(self): 'dim', "The number of days in the month") daysinmonth = days_in_month - is_month_start = _field_accessor( - 'is_month_start', - 'is_month_start', - "Logical indicating if first day of 
month (defined by frequency)") - is_month_end = _field_accessor( - 'is_month_end', - 'is_month_end', - """ - Indicator for whether the date is the last day of the month. + _is_month_doc = """ + Indicates whether the date is the {first_or_last} day of the month. Returns ------- Series or array - For Series, returns a Series with boolean values. For - DatetimeIndex, returns a boolean array. + For Series, returns a Series with boolean values. + For DatetimeIndex, returns a boolean array. See Also -------- - is_month_start : Indicator for whether the date is the first day - of the month. + is_month_start : Return a boolean indicating whether the date + is the first day of the month. + is_month_end : Return a boolean indicating whether the date + is the last day of the month. Examples -------- This method is available on Series with datetime values under the ``.dt`` accessor, and directly on DatetimeIndex. - >>> dates = pd.Series(pd.date_range("2018-02-27", periods=3)) - >>> dates + >>> s = pd.Series(pd.date_range("2018-02-27", periods=3)) + >>> s 0 2018-02-27 1 2018-02-28 2 2018-03-01 dtype: datetime64[ns] - >>> dates.dt.is_month_end + >>> s.dt.is_month_start + 0 False + 1 False + 2 True + dtype: bool + >>> s.dt.is_month_end 0 False 1 True 2 False dtype: bool >>> idx = pd.date_range("2018-02-27", periods=3) + >>> idx.is_month_start + array([False, False, True]) >>> idx.is_month_end - array([False, True, False], dtype=bool) - """) + array([False, True, False]) + """ + is_month_start = _field_accessor( + 'is_month_start', + 'is_month_start', + _is_month_doc.format(first_or_last='first')) + + is_month_end = _field_accessor( + 'is_month_end', + 'is_month_end', + _is_month_doc.format(first_or_last='last')) + is_quarter_start = _field_accessor( 'is_quarter_start', 'is_quarter_start', From 88a57c9cc861f066abc0caa0bb902fd827b2fa97 Mon Sep 17 00:00:00 2001 From: Tom Augspurger Date: Fri, 26 Oct 2018 07:07:43 -0500 Subject: [PATCH 19/23] CI: Migrate some CircleCI jobs to Azure (#22992) --- .circleci/config.yml | 111 +----------------- .travis.yml | 8 +- azure-pipelines.yml | 8 +- ...le-27-compat.yaml => azure-27-compat.yaml} | 0 ...le_slow.yaml => azure-36-locale_slow.yaml} | 0 ci/azure-37-locale.yaml | 35 ++++++ ci/azure/linux.yml | 56 +++++++++ ci/azure/macos.yml | 2 +- ci/circle-35-ascii.yaml | 15 --- ci/{ => circle}/install_circle.sh | 0 ci/{ => circle}/run_circle.sh | 0 ci/{ => circle}/show_circle.sh | 0 ci/incremental/setup_conda_environment.sh | 8 +- ci/script_multi.sh | 12 +- ci/script_single.sh | 12 +- doc/source/contributing.rst | 2 +- 16 files changed, 122 insertions(+), 147 deletions(-) rename ci/{circle-27-compat.yaml => azure-27-compat.yaml} (100%) rename ci/{circle-36-locale_slow.yaml => azure-36-locale_slow.yaml} (100%) create mode 100644 ci/azure-37-locale.yaml create mode 100644 ci/azure/linux.yml delete mode 100644 ci/circle-35-ascii.yaml rename ci/{ => circle}/install_circle.sh (100%) rename ci/{ => circle}/run_circle.sh (100%) rename ci/{ => circle}/show_circle.sh (100%) diff --git a/.circleci/config.yml b/.circleci/config.yml index e947f30d285cd..5b10036818901 100644 --- a/.circleci/config.yml +++ b/.circleci/config.yml @@ -1,39 +1,6 @@ version: 2 jobs: - # -------------------------------------------------------------------------- - # 0. 
py27_compat - # -------------------------------------------------------------------------- - py27_compat: - docker: - - image: continuumio/miniconda:latest - # databases configuration - - image: circleci/postgres:9.6.5-alpine-ram - environment: - POSTGRES_USER: postgres - POSTGRES_DB: pandas_nosetest - - image: circleci/mysql:8-ram - environment: - MYSQL_USER: "root" - MYSQL_HOST: "localhost" - MYSQL_ALLOW_EMPTY_PASSWORD: "true" - MYSQL_DATABASE: "pandas_nosetest" - environment: - JOB: "2.7_COMPAT" - ENV_FILE: "ci/circle-27-compat.yaml" - LOCALE_OVERRIDE: "it_IT.UTF-8" - MINICONDA_DIR: /home/ubuntu/miniconda3 - steps: - - checkout - - run: - name: build - command: | - ./ci/install_circle.sh - ./ci/show_circle.sh - - run: - name: test - command: ./ci/run_circle.sh --skip-slow --skip-network - # -------------------------------------------------------------------------- # 1. py36_locale # -------------------------------------------------------------------------- @@ -62,86 +29,14 @@ jobs: - run: name: build command: | - ./ci/install_circle.sh - ./ci/show_circle.sh + ./ci/circle/install_circle.sh + ./ci/circle/show_circle.sh - run: name: test - command: ./ci/run_circle.sh --skip-slow --skip-network - - # -------------------------------------------------------------------------- - # 2. py36_locale_slow - # -------------------------------------------------------------------------- - py36_locale_slow: - docker: - - image: continuumio/miniconda:latest - # databases configuration - - image: circleci/postgres:9.6.5-alpine-ram - environment: - POSTGRES_USER: postgres - POSTGRES_DB: pandas_nosetest - - image: circleci/mysql:8-ram - environment: - MYSQL_USER: "root" - MYSQL_HOST: "localhost" - MYSQL_ALLOW_EMPTY_PASSWORD: "true" - MYSQL_DATABASE: "pandas_nosetest" - - environment: - JOB: "3.6_LOCALE_SLOW" - ENV_FILE: "ci/circle-36-locale_slow.yaml" - LOCALE_OVERRIDE: "zh_CN.UTF-8" - MINICONDA_DIR: /home/ubuntu/miniconda3 - steps: - - checkout - - run: - name: build - command: | - ./ci/install_circle.sh - ./ci/show_circle.sh - - run: - name: test - command: ./ci/run_circle.sh --only-slow --skip-network - - # -------------------------------------------------------------------------- - # 3. 
py35_ascii - # -------------------------------------------------------------------------- - py35_ascii: - docker: - - image: continuumio/miniconda:latest - # databases configuration - - image: circleci/postgres:9.6.5-alpine-ram - environment: - POSTGRES_USER: postgres - POSTGRES_DB: pandas_nosetest - - image: circleci/mysql:8-ram - environment: - MYSQL_USER: "root" - MYSQL_HOST: "localhost" - MYSQL_ALLOW_EMPTY_PASSWORD: "true" - MYSQL_DATABASE: "pandas_nosetest" - - environment: - JOB: "3.5_ASCII" - ENV_FILE: "ci/circle-35-ascii.yaml" - LOCALE_OVERRIDE: "C" - MINICONDA_DIR: /home/ubuntu/miniconda3 - steps: - - checkout - - run: - name: build - command: | - ./ci/install_circle.sh - ./ci/show_circle.sh - - run: - name: test - command: ./ci/run_circle.sh --skip-slow --skip-network - + command: ./ci/circle/run_circle.sh --skip-slow --skip-network workflows: version: 2 build_and_test: jobs: - - py27_compat - py36_locale - - py36_locale_slow - - py35_ascii diff --git a/.travis.yml b/.travis.yml index e8f7f3465bfd5..8ac4d827b0820 100644 --- a/.travis.yml +++ b/.travis.yml @@ -116,10 +116,10 @@ after_success: after_script: - echo "after_script start" - source activate pandas && pushd /tmp && python -c "import pandas; pandas.show_versions();" && popd - - if [ -e /tmp/single.xml ]; then - ci/print_skipped.py /tmp/single.xml; + - if [ -e test-data-single.xml ]; then + ci/print_skipped.py test-data-single.xml; fi - - if [ -e /tmp/multiple.xml ]; then - ci/print_skipped.py /tmp/multiple.xml; + - if [ -e test-data-multiple.xml ]; then + ci/print_skipped.py test-data-multiple.xml; fi - echo "after_script done" diff --git a/azure-pipelines.yml b/azure-pipelines.yml index 5d473bfc5a38c..373c22fdf8e62 100644 --- a/azure-pipelines.yml +++ b/azure-pipelines.yml @@ -7,10 +7,10 @@ jobs: parameters: name: macOS vmImage: xcode9-macos10.13 -# - template: ci/azure/linux.yml -# parameters: -# name: Linux -# vmImage: ubuntu-16.04 +- template: ci/azure/linux.yml + parameters: + name: Linux + vmImage: ubuntu-16.04 # Windows Python 2.7 needs VC 9.0 installed, and not sure # how to make that a conditional task, so for now these are diff --git a/ci/circle-27-compat.yaml b/ci/azure-27-compat.yaml similarity index 100% rename from ci/circle-27-compat.yaml rename to ci/azure-27-compat.yaml diff --git a/ci/circle-36-locale_slow.yaml b/ci/azure-36-locale_slow.yaml similarity index 100% rename from ci/circle-36-locale_slow.yaml rename to ci/azure-36-locale_slow.yaml diff --git a/ci/azure-37-locale.yaml b/ci/azure-37-locale.yaml new file mode 100644 index 0000000000000..ef97b85406709 --- /dev/null +++ b/ci/azure-37-locale.yaml @@ -0,0 +1,35 @@ +name: pandas +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - cython>=0.28.2 + - html5lib + - ipython + - jinja2 + - lxml + - matplotlib + - nomkl + - numexpr + - numpy + - openpyxl=2.5.5 + - psycopg2 + - pymysql + - pytables + - python-dateutil + - python=3.6* + - pytz + - s3fs + - scipy + - sqlalchemy + - xarray + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest + - pytest-xdist + - moto + - pip: + - hypothesis>=3.58.0 diff --git a/ci/azure/linux.yml b/ci/azure/linux.yml new file mode 100644 index 0000000000000..f34cba69a6195 --- /dev/null +++ b/ci/azure/linux.yml @@ -0,0 +1,56 @@ +parameters: + name: '' + vmImage: '' + +jobs: +- job: ${{ parameters.name }} + pool: + vmImage: ${{ parameters.vmImage }} + strategy: + maxParallel: 11 + matrix: + py27_np_19: + ENV_FILE: ci/azure-27-compat.yaml + CONDA_PY: "27" + CONDA_ENV: pandas + TEST_ARGS: "--skip-slow 
--skip-network" + + py36_locale: + ENV_FILE: ci/azure-37-locale.yaml + CONDA_PY: "37" + CONDA_ENV: pandas + TEST_ARGS: "--skip-slow --skip-network" + LOCALE_OVERRIDE: "zh_CN.UTF-8" + + py36_locale_slow: + ENV_FILE: ci/azure-36-locale_slow.yaml + CONDA_PY: "36" + CONDA_ENV: pandas + TEST_ARGS: "--only-slow --skip-network" + + steps: + - script: | + if [ "$(uname)" == "Linux" ]; then sudo apt-get install -y libc6-dev-i386; fi + echo "Installing Miniconda"{ + ci/incremental/install_miniconda.sh + export PATH=$HOME/miniconda3/bin:$PATH + echo "Setting up Conda environment" + ci/incremental/setup_conda_environment.sh + displayName: 'Before Install' + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + ci/incremental/build.sh + displayName: 'Build' + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + ci/script_single.sh + ci/script_multi.sh + echo "[Test done]" + displayName: 'Test' + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas && pushd /tmp && python -c "import pandas; pandas.show_versions();" && popd + - task: PublishTestResults@2 + inputs: + testResultsFiles: 'test-data-*.xml' + testRunTitle: 'Linux' \ No newline at end of file diff --git a/ci/azure/macos.yml b/ci/azure/macos.yml index fb10d89731f26..53ce51c76683c 100644 --- a/ci/azure/macos.yml +++ b/ci/azure/macos.yml @@ -39,5 +39,5 @@ jobs: source activate pandas && pushd /tmp && python -c "import pandas; pandas.show_versions();" && popd - task: PublishTestResults@2 inputs: - testResultsFiles: '/tmp/*.xml' + testResultsFiles: 'test-data-*.xml' testRunTitle: 'MacOS-35' diff --git a/ci/circle-35-ascii.yaml b/ci/circle-35-ascii.yaml deleted file mode 100644 index 281ed59e2deff..0000000000000 --- a/ci/circle-35-ascii.yaml +++ /dev/null @@ -1,15 +0,0 @@ -name: pandas -channels: - - defaults -dependencies: - - cython>=0.28.2 - - nomkl - - numpy - - python-dateutil - - python=3.5* - - pytz - # universal - - pytest - - pytest-xdist - - pip: - - hypothesis>=3.58.0 diff --git a/ci/install_circle.sh b/ci/circle/install_circle.sh similarity index 100% rename from ci/install_circle.sh rename to ci/circle/install_circle.sh diff --git a/ci/run_circle.sh b/ci/circle/run_circle.sh similarity index 100% rename from ci/run_circle.sh rename to ci/circle/run_circle.sh diff --git a/ci/show_circle.sh b/ci/circle/show_circle.sh similarity index 100% rename from ci/show_circle.sh rename to ci/circle/show_circle.sh diff --git a/ci/incremental/setup_conda_environment.sh b/ci/incremental/setup_conda_environment.sh index c716a39138644..f3ac99d5e7c5a 100755 --- a/ci/incremental/setup_conda_environment.sh +++ b/ci/incremental/setup_conda_environment.sh @@ -27,13 +27,17 @@ set -v # w/o removing anything else echo echo "[removing installed pandas]" -conda remove pandas -y --force -pip uninstall -y pandas +conda remove pandas -y --force || true +pip uninstall -y pandas || true echo echo "[no installed pandas]" conda list pandas +if [ -n "$LOCALE_OVERRIDE" ]; then + sudo locale-gen "$LOCALE_OVERRIDE" +fi + # # Install the compiler toolchain # if [[ $(uname) == Linux ]]; then # if [[ "$CONDA_SUBDIR" == "linux-32" || "$BITS32" == "yes" ]] ; then diff --git a/ci/script_multi.sh b/ci/script_multi.sh index dcc5a14d7b3b4..e076558e8fff3 100755 --- a/ci/script_multi.sh +++ b/ci/script_multi.sh @@ -27,17 +27,17 @@ if [ "$DOC" ]; then echo "We are not running pytest as this is a doc-build" elif [ "$COVERAGE" ]; then - echo pytest -s -n 2 -m "not single" --cov=pandas --cov-report xml:/tmp/cov-multiple.xml --junitxml=/tmp/multiple.xml --strict 
$TEST_ARGS pandas - pytest -s -n 2 -m "not single" --cov=pandas --cov-report xml:/tmp/cov-multiple.xml --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas + echo pytest -s -n 2 -m "not single" --cov=pandas --cov-report xml:/tmp/cov-multiple.xml --junitxml=test-data-multiple.xml --strict $TEST_ARGS pandas + pytest -s -n 2 -m "not single" --cov=pandas --cov-report xml:/tmp/cov-multiple.xml --junitxml=test-data-multiple.xml --strict $TEST_ARGS pandas elif [ "$SLOW" ]; then TEST_ARGS="--only-slow --skip-network" - echo pytest -m "not single and slow" -v --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas - pytest -m "not single and slow" -v --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas + echo pytest -m "not single and slow" -v --junitxml=test-data-multiple.xml --strict $TEST_ARGS pandas + pytest -m "not single and slow" -v --junitxml=test-data-multiple.xml --strict $TEST_ARGS pandas else - echo pytest -n 2 -m "not single" --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas - pytest -n 2 -m "not single" --junitxml=/tmp/multiple.xml --strict $TEST_ARGS pandas # TODO: doctest + echo pytest -n 2 -m "not single" --junitxml=test-data-multiple.xml --strict $TEST_ARGS pandas + pytest -n 2 -m "not single" --junitxml=test-data-multiple.xml --strict $TEST_ARGS pandas # TODO: doctest fi diff --git a/ci/script_single.sh b/ci/script_single.sh index 09e7446a2d876..42d326e0965ee 100755 --- a/ci/script_single.sh +++ b/ci/script_single.sh @@ -5,8 +5,9 @@ echo "[script_single]" source activate pandas if [ -n "$LOCALE_OVERRIDE" ]; then + echo "Setting LC_ALL and LANG to $LOCALE_OVERRIDE" export LC_ALL="$LOCALE_OVERRIDE"; - echo "Setting LC_ALL to $LOCALE_OVERRIDE" + export LANG="$LOCALE_OVERRIDE"; pycmd='import pandas; print("pandas detected console encoding: %s" % pandas.get_option("display.encoding"))' python -c "$pycmd" @@ -25,14 +26,13 @@ if [ "$DOC" ]; then echo "We are not running pytest as this is a doc-build" elif [ "$COVERAGE" ]; then - echo pytest -s -m "single" --strict --cov=pandas --cov-report xml:/tmp/cov-single.xml --junitxml=/tmp/single.xml $TEST_ARGS pandas - pytest -s -m "single" --strict --cov=pandas --cov-report xml:/tmp/cov-single.xml --junitxml=/tmp/single.xml $TEST_ARGS pandas - + echo pytest -s -m "single" --strict --cov=pandas --cov-report xml:/tmp/cov-single.xml --junitxml=test-data-single.xml $TEST_ARGS pandas + pytest -s -m "single" --strict --cov=pandas --cov-report xml:/tmp/cov-single.xml --junitxml=test-data-single.xml $TEST_ARGS pandas echo pytest -s --strict scripts pytest -s --strict scripts else - echo pytest -m "single" --junitxml=/tmp/single.xml --strict $TEST_ARGS pandas - pytest -m "single" --junitxml=/tmp/single.xml --strict $TEST_ARGS pandas # TODO: doctest + echo pytest -m "single" --junitxml=test-data-single.xml --strict $TEST_ARGS pandas + pytest -m "single" --junitxml=test-data-single.xml --strict $TEST_ARGS pandas fi diff --git a/doc/source/contributing.rst b/doc/source/contributing.rst index 67b8d287d5d1a..66d545a0de6e9 100644 --- a/doc/source/contributing.rst +++ b/doc/source/contributing.rst @@ -684,7 +684,7 @@ Test-driven development/code writing ------------------------------------ *pandas* is serious about testing and strongly encourages contributors to embrace -`test-driven development (TDD) `_. +`test-driven development (TDD) `_. 
This development process "relies on the repetition of a very short development cycle: first the developer writes an (initially failing) automated test case that defines a desired improvement or new function, then produces the minimum amount of code to pass that test." From 48782a8f6de2564cff08517a3f6753734690b711 Mon Sep 17 00:00:00 2001 From: Tom Augspurger Date: Fri, 26 Oct 2018 07:23:40 -0500 Subject: [PATCH 20/23] REF: SparseArray imports (#23329) --- pandas/core/arrays/sparse.py | 76 ++++++++++++++++-------------------- pandas/core/series.py | 3 +- setup.cfg | 2 - 3 files changed, 35 insertions(+), 46 deletions(-) diff --git a/pandas/core/arrays/sparse.py b/pandas/core/arrays/sparse.py index 72527cfa5d12e..08c961935a990 100644 --- a/pandas/core/arrays/sparse.py +++ b/pandas/core/arrays/sparse.py @@ -2,57 +2,47 @@ SparseArray data structure """ from __future__ import division -# pylint: disable=E1101,E1103,W0231 -import re -import operator import numbers -import numpy as np +import operator +import re import warnings -import pandas as pd -from pandas.core.base import PandasObject +import numpy as np +import pandas._libs.sparse as splib +import pandas.core.algorithms as algos +import pandas.core.common as com +import pandas.io.formats.printing as printing from pandas import compat -from pandas.errors import PerformanceWarning +from pandas._libs import index as libindex, lib +from pandas._libs.sparse import BlockIndex, IntIndex +from pandas._libs.tslibs import NaT from pandas.compat.numpy import function as nv - from pandas.core.accessor import PandasDelegate, delegate_names from pandas.core.arrays import ExtensionArray, ExtensionOpsMixin -import pandas.core.common as com +from pandas.core.base import PandasObject from pandas.core.dtypes.base import ExtensionDtype +from pandas.core.dtypes.cast import ( + astype_nansafe, construct_1d_arraylike_from_scalar, find_common_type, + infer_dtype_from_scalar, maybe_convert_platform +) +from pandas.core.dtypes.common import ( + is_array_like, is_bool_dtype, is_datetime64_any_dtype, is_dtype_equal, + is_integer, is_list_like, is_object_dtype, is_scalar, is_string_dtype, + pandas_dtype +) from pandas.core.dtypes.dtypes import register_extension_dtype from pandas.core.dtypes.generic import ( - ABCSparseSeries, ABCSeries, ABCIndexClass + ABCIndexClass, ABCSeries, ABCSparseSeries ) -from pandas.core.dtypes.common import ( - is_datetime64_any_dtype, - is_integer, - is_object_dtype, - is_array_like, - pandas_dtype, - is_bool_dtype, - is_list_like, - is_string_dtype, - is_scalar, is_dtype_equal) -from pandas.core.dtypes.cast import ( - maybe_convert_platform, - astype_nansafe, find_common_type, infer_dtype_from_scalar, - construct_1d_arraylike_from_scalar) -from pandas.core.dtypes.missing import isna, notna, na_value_for_dtype +from pandas.core.dtypes.missing import isna, na_value_for_dtype, notna from pandas.core.missing import interpolate_2d - -import pandas._libs.sparse as splib -from pandas._libs.sparse import BlockIndex, IntIndex -from pandas._libs import index as libindex -from pandas._libs import lib -import pandas.core.algorithms as algos -import pandas.io.formats.printing as printing +from pandas.errors import PerformanceWarning # ---------------------------------------------------------------------------- # Dtype - @register_extension_dtype class SparseDtype(ExtensionDtype): """ @@ -620,7 +610,7 @@ def __array__(self, dtype=None, copy=True): if is_datetime64_any_dtype(self.sp_values.dtype): # However, we *do* special-case the common case of # a 
datetime64 with pandas NaT. - if fill_value is pd.NaT: + if fill_value is NaT: # Can't put pd.NaT in a datetime64[ns] fill_value = np.datetime64('NaT') try: @@ -710,7 +700,7 @@ def _null_fill_value(self): def _fill_value_matches(self, fill_value): if self._null_fill_value: - return pd.isna(fill_value) + return isna(fill_value) else: return self.fill_value == fill_value @@ -855,7 +845,7 @@ def _first_fill_value_loc(self): return np.searchsorted(diff, 2) + 1 def unique(self): - uniques = list(pd.unique(self.sp_values)) + uniques = list(algos.unique(self.sp_values)) fill_loc = self._first_fill_value_loc() if fill_loc >= 0: uniques.insert(fill_loc, self.fill_value) @@ -871,8 +861,8 @@ def factorize(self, na_sentinel=-1): # ExtensionArray.factorize -> Tuple[EA, EA] # Given that we have to return a dense array of labels, why bother # implementing an efficient factorize? - labels, uniques = pd.factorize(np.asarray(self), - na_sentinel=na_sentinel) + labels, uniques = algos.factorize(np.asarray(self), + na_sentinel=na_sentinel) uniques = SparseArray(uniques, dtype=self.dtype) return labels, uniques @@ -889,6 +879,8 @@ def value_counts(self, dropna=True): ------- counts : Series """ + from pandas import Index, Series + keys, counts = algos._value_counts_arraylike(self.sp_values, dropna=dropna) fcounts = self.sp_index.ngaps @@ -897,7 +889,7 @@ def value_counts(self, dropna=True): pass else: if self._null_fill_value: - mask = pd.isna(keys) + mask = isna(keys) else: mask = keys == self.fill_value @@ -907,9 +899,9 @@ def value_counts(self, dropna=True): keys = np.insert(keys, 0, self.fill_value) counts = np.insert(counts, 0, fcounts) - if not isinstance(keys, pd.Index): - keys = pd.Index(keys) - result = pd.Series(counts, index=keys) + if not isinstance(keys, ABCIndexClass): + keys = Index(keys) + result = Series(counts, index=keys) return result # -------- diff --git a/pandas/core/series.py b/pandas/core/series.py index d813d8430d9e9..d03a88ea78f6f 100644 --- a/pandas/core/series.py +++ b/pandas/core/series.py @@ -24,7 +24,7 @@ from pandas.compat.numpy import function as nv from pandas.core import base, generic from pandas.core.accessor import CachedAccessor -from pandas.core.arrays import ExtensionArray, period_array +from pandas.core.arrays import ExtensionArray, SparseArray, period_array from pandas.core.arrays.categorical import Categorical, CategoricalAccessor from pandas.core.arrays.sparse import SparseAccessor from pandas.core.config import get_option @@ -1367,7 +1367,6 @@ def to_sparse(self, kind='block', fill_value=None): """ # TODO: deprecate from pandas.core.sparse.series import SparseSeries - from pandas.core.arrays import SparseArray values = SparseArray(self, kind=kind, fill_value=fill_value) return SparseSeries( diff --git a/setup.cfg b/setup.cfg index f26eac0d2ae62..a5006d66868f6 100644 --- a/setup.cfg +++ b/setup.cfg @@ -175,8 +175,6 @@ skip= pandas/core/reshape/merge.py, pandas/core/reshape/reshape.py, pandas/core/reshape/pivot.py, - pandas/core/sparse/array.py, - pandas/core/arrays/sparse.py, pandas/core/sparse/api.py, pandas/core/sparse/series.py, pandas/core/sparse/frame.py, From 5d84bc08ea7c45b0d2b3aa021a425b11531336f1 Mon Sep 17 00:00:00 2001 From: Tom Augspurger Date: Fri, 26 Oct 2018 07:24:03 -0500 Subject: [PATCH 21/23] BUG: Handle Period in combine (#23350) --- pandas/core/dtypes/cast.py | 8 +++++++- pandas/tests/frame/test_combine_concat.py | 1 - 2 files changed, 7 insertions(+), 2 deletions(-) diff --git a/pandas/core/dtypes/cast.py b/pandas/core/dtypes/cast.py index 
56bf394729773..46c8126f65fec 100644 --- a/pandas/core/dtypes/cast.py +++ b/pandas/core/dtypes/cast.py @@ -6,7 +6,7 @@ import warnings from pandas._libs import tslib, lib, tslibs -from pandas._libs.tslibs import iNaT, OutOfBoundsDatetime +from pandas._libs.tslibs import iNaT, OutOfBoundsDatetime, Period from pandas.compat import string_types, text_type, PY3 from .common import (ensure_object, is_bool, is_integer, is_float, is_complex, is_datetimetz, is_categorical_dtype, @@ -164,6 +164,12 @@ def trans(x): # noqa result = to_datetime(result).tz_localize('utc') result = result.tz_convert(dtype.tz) + elif dtype.type == Period: + # TODO(DatetimeArray): merge with previous elif + from pandas.core.arrays import PeriodArray + + return PeriodArray(result, freq=dtype.freq) + except Exception: pass diff --git a/pandas/tests/frame/test_combine_concat.py b/pandas/tests/frame/test_combine_concat.py index 2803db4f496a5..3b8d6e6c55ed1 100644 --- a/pandas/tests/frame/test_combine_concat.py +++ b/pandas/tests/frame/test_combine_concat.py @@ -759,7 +759,6 @@ def test_combine_first_timedelta(self): tm.assert_frame_equal(res, exp) assert res['TD'].dtype == 'timedelta64[ns]' - @pytest.mark.xfail(reason="GH-23079", strict=True) def test_combine_first_period(self): data1 = pd.PeriodIndex(['2011-01', 'NaT', '2011-03', '2011-04'], freq='M') From caea25a8b91d62b30eef99aa0c523448e19cd6db Mon Sep 17 00:00:00 2001 From: Tom Augspurger Date: Fri, 26 Oct 2018 07:24:38 -0500 Subject: [PATCH 22/23] TST: Fix test assertion (#23357) --- pandas/tests/extension/base/setitem.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/pandas/tests/extension/base/setitem.py b/pandas/tests/extension/base/setitem.py index 6ebe3cb7487ab..029a77acb121f 100644 --- a/pandas/tests/extension/base/setitem.py +++ b/pandas/tests/extension/base/setitem.py @@ -27,6 +27,7 @@ def test_setitem_sequence(self, data, box_in_series): @pytest.mark.parametrize('as_array', [True, False]) def test_setitem_sequence_mismatched_length_raises(self, data, as_array): ser = pd.Series(data) + original = ser.copy() value = [data[0]] if as_array: value = data._from_sequence(value) @@ -34,11 +35,12 @@ def test_setitem_sequence_mismatched_length_raises(self, data, as_array): xpr = 'cannot set using a {} indexer with a different length' with tm.assert_raises_regex(ValueError, xpr.format('list-like')): ser[[0, 1]] = value - assert ser._values[[0, 1]] == value + # Ensure no modifications made before the exception + self.assert_series_equal(ser, original) with tm.assert_raises_regex(ValueError, xpr.format('slice')): ser[slice(3)] = value - assert ser._values[slice(3)] == value + self.assert_series_equal(ser, original) def test_setitem_empty_indxer(self, data, box_in_series): if box_in_series: From f662c5f2a7b392ee96a43f055073c8523f8f0339 Mon Sep 17 00:00:00 2001 From: Allison Browne Date: Fri, 26 Oct 2018 17:23:21 -0400 Subject: [PATCH 23/23] DOC: Add docstring validations for "See Also" section (#23143) --- scripts/tests/test_validate_docstrings.py | 32 +++++++++++++++++++++++ scripts/validate_docstrings.py | 9 ++++++- 2 files changed, 40 insertions(+), 1 deletion(-) diff --git a/scripts/tests/test_validate_docstrings.py b/scripts/tests/test_validate_docstrings.py index fcae4051dc471..6bf832fb9dc6d 100644 --- a/scripts/tests/test_validate_docstrings.py +++ b/scripts/tests/test_validate_docstrings.py @@ -334,6 +334,33 @@ def method(self, foo=None, bar=None): pass +class BadSeeAlso(object): + + def desc_no_period(self): + """ + Return the first 5 elements 
of the Series. + + See Also + -------- + Series.tail : Return the last 5 elements of the Series. + Series.iloc : Return a slice of the elements in the Series, + which can also be used to return the first or last n + """ + pass + + def desc_first_letter_lowercase(self): + """ + Return the first 5 elements of the Series. + + See Also + -------- + Series.tail : return the last 5 elements of the Series. + Series.iloc : Return a slice of the elements in the Series, + which can also be used to return the first or last n. + """ + pass + + class BadSummaries(object): def wrong_line(self): @@ -608,6 +635,11 @@ def test_bad_generic_functions(self, func): assert errors @pytest.mark.parametrize("klass,func,msgs", [ + # See Also tests + ('BadSeeAlso', 'desc_no_period', + ('Missing period at end of description for See Also "Series.iloc"',)), + ('BadSeeAlso', 'desc_first_letter_lowercase', + ('should be capitalized for See Also "Series.tail"',)), # Summary tests ('BadSummaries', 'wrong_line', ('should start in the line immediately after the opening quotes',)), diff --git a/scripts/validate_docstrings.py b/scripts/validate_docstrings.py index c571827db70f8..2fef3332de55c 100755 --- a/scripts/validate_docstrings.py +++ b/scripts/validate_docstrings.py @@ -505,7 +505,14 @@ def validate_one(func_name): wrns.append('See Also section not found') else: for rel_name, rel_desc in doc.see_also.items(): - if not rel_desc: + if rel_desc: + if not rel_desc.endswith('.'): + errs.append('Missing period at end of description for ' + 'See Also "{}" reference'.format(rel_name)) + if not rel_desc[0].isupper(): + errs.append('Description should be capitalized for ' + 'See Also "{}" reference'.format(rel_name)) + else: errs.append('Missing description for ' 'See Also "{}" reference'.format(rel_name))
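
A quick end-to-end illustration of the ``Series.sparse`` accessor introduced in PATCH 15. This is a minimal sketch, assuming pandas 0.24.0 with these patches applied and scipy installed; the variable names are illustrative only:

    import pandas as pd
    from scipy import sparse

    # Integer data with a SparseDtype; zeros are the fill_value and are
    # not physically stored.
    s = pd.Series([0, 0, 1, 2], dtype="Sparse[int]")
    s.sparse.density      # 0.5 -- two of the four points are stored
    s.sparse.npoints      # 2
    s.sparse.fill_value   # 0
    s.sparse.sp_values    # array([1, 2])

    # Round-trip through scipy's COO format, mirroring the docstring example.
    A = sparse.coo_matrix(([3.0, 1.0, 2.0], ([1, 0, 0], [0, 2, 3])),
                          shape=(3, 4))
    ss = pd.Series.sparse.from_coo(A)   # MultiIndex of (row, col) -> value
    A2, rows, columns = ss.sparse.to_coo(row_levels=[0], column_levels=[1])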
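PATCH 21 teaches ``maybe_downcast_to_dtype`` to rebuild a ``PeriodArray``, which is what lets the previously xfailed ``test_combine_first_period`` pass. A minimal sketch of the behavior it fixes, using the same data as that test (assuming these patches applied):

    import pandas as pd

    data1 = pd.PeriodIndex(['2011-01', 'NaT', '2011-03', '2011-04'], freq='M')
    df1 = pd.DataFrame({'P': data1})
    data2 = pd.PeriodIndex(['2012-01', '2012-02', 'NaT', '2012-04'], freq='M')
    df2 = pd.DataFrame({'P': data2})

    res = df1.combine_first(df2)
    # The NaT in df1 is filled from df2 and the combined column keeps the
    # period[M] dtype instead of decaying to object.
    res['P'].dtype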
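PATCH 23 extends ``validate_docstrings.py`` so that every entry in a ``See Also`` section must carry a description that starts with a capital letter and ends with a period. For reference, a docstring that passes both new checks looks like this (the method itself is hypothetical, a corrected version of the ``BadSeeAlso`` fixtures above):

    def head(self):
        """
        Return the first 5 elements of the Series.

        See Also
        --------
        Series.tail : Return the last 5 elements of the Series.
        Series.iloc : Return a slice of the elements in the Series,
            which can also be used to return the first or last n.
        """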